{ "cells": [ { "cell_type": "code", "execution_count": 1, "metadata": {}, "outputs": [ { "name": "stderr", "output_type": "stream", "text": [ "/home/donbr/aie3-bootcamp/arxiv-rag-mvp/.venv/lib/python3.10/site-packages/tqdm/auto.py:21: TqdmWarning: IProgress not found. Please update jupyter and ipywidgets. See https://ipywidgets.readthedocs.io/en/stable/user_install.html\n", " from .autonotebook import tqdm as notebook_tqdm\n" ] } ], "source": [ "from data_ingestion import run_ingestion_pipeline" ] }, { "cell_type": "code", "execution_count": 2, "metadata": {}, "outputs": [ { "name": "stderr", "output_type": "stream", "text": [ "2024-07-06 09:04:10,909 - INFO - Fetching arXiv metadata for query: System of Agents\n", "2024-07-06 09:04:10,910 - INFO - Requesting page (first: True, try: 0): https://export.arxiv.org/api/query?search_query=System+of+Agents&id_list=&sortBy=submittedDate&sortOrder=descending&start=0&max_results=10\n", "2024-07-06 09:04:12,477 - INFO - Got first page: 10 of 2492622 total results\n", "2024-07-06 09:04:12,479 - INFO - Fetched metadata for 10 papers: [{'title': 'Planetarium: A Rigorous Benchmark for Translating Text to Structured Planning Languages', 'authors': ['Max Zuo', 'Francisco Piedrahita Velez', 'Xiaochen Li', 'Michael L. Littman', 'Stephen H. Bach'], 'published': '2024-07-03T17:59:53+00:00', 'updated': '2024-07-03T17:59:53+00:00', 'pdf_url': 'http://arxiv.org/pdf/2407.03321v1', 'entry_id': 'http://arxiv.org/abs/2407.03321v1', 'summary': \"Many recent works have explored using language models for planning problems.\\nOne line of research focuses on translating natural language descriptions of\\nplanning tasks into structured planning languages, such as the planning domain\\ndefinition language (PDDL). While this approach is promising, accurately\\nmeasuring the quality of generated PDDL code continues to pose significant\\nchallenges. 
First, generated PDDL code is typically evaluated using planning\\nvalidators that check whether the problem can be solved with a planner. This\\nmethod is insufficient because a language model might generate valid PDDL code\\nthat does not align with the natural language description of the task. Second,\\nexisting evaluation sets often have natural language descriptions of the\\nplanning task that closely resemble the ground truth PDDL, reducing the\\nchallenge of the task. To bridge this gap, we introduce \\\\benchmarkName, a\\nbenchmark designed to evaluate language models' ability to generate PDDL code\\nfrom natural language descriptions of planning tasks. We begin by creating a\\nPDDL equivalence algorithm that rigorously evaluates the correctness of PDDL\\ncode generated by language models by flexibly comparing it against a ground\\ntruth PDDL. Then, we present a dataset of $132,037$ text-to-PDDL pairs across\\n13 different tasks, with varying levels of difficulty. Finally, we evaluate\\nseveral API-access and open-weight language models that reveal this task's\\ncomplexity. 
For example, $87.6\\\\%$ of the PDDL problem descriptions generated by\\nGPT-4o are syntactically parseable, $82.2\\\\%$ are valid, solve-able problems,\\nbut only $35.1\\\\%$ are semantically correct, highlighting the need for a more\\nrigorous benchmark for this problem.\"}, {'title': 'InternLM-XComposer-2.5: A Versatile Large Vision Language Model Supporting Long-Contextual Input and Output', 'authors': ['Pan Zhang', 'Xiaoyi Dong', 'Yuhang Zang', 'Yuhang Cao', 'Rui Qian', 'Lin Chen', 'Qipeng Guo', 'Haodong Duan', 'Bin Wang', 'Linke Ouyang', 'Songyang Zhang', 'Wenwei Zhang', 'Yining Li', 'Yang Gao', 'Peng Sun', 'Xinyue Zhang', 'Wei Li', 'Jingwen Li', 'Wenhai Wang', 'Hang Yan', 'Conghui He', 'Xingcheng Zhang', 'Kai Chen', 'Jifeng Dai', 'Yu Qiao', 'Dahua Lin', 'Jiaqi Wang'], 'published': '2024-07-03T17:59:21+00:00', 'updated': '2024-07-03T17:59:21+00:00', 'pdf_url': 'http://arxiv.org/pdf/2407.03320v1', 'entry_id': 'http://arxiv.org/abs/2407.03320v1', 'summary': 'We present InternLM-XComposer-2.5 (IXC-2.5), a versatile large-vision\\nlanguage model that supports long-contextual input and output. IXC-2.5 excels\\nin various text-image comprehension and composition applications, achieving\\nGPT-4V level capabilities with merely 7B LLM backend. Trained with 24K\\ninterleaved image-text contexts, it can seamlessly extend to 96K long contexts\\nvia RoPE extrapolation. This long-context capability allows IXC-2.5 to excel in\\ntasks requiring extensive input and output contexts. Compared to its previous\\n2.0 version, InternLM-XComposer-2.5 features three major upgrades in\\nvision-language comprehension: (1) Ultra-High Resolution Understanding, (2)\\nFine-Grained Video Understanding, and (3) Multi-Turn Multi-Image Dialogue. In\\naddition to comprehension, IXC-2.5 extends to two compelling applications using\\nextra LoRA parameters for text-image composition: (1) Crafting Webpages and (2)\\nComposing High-Quality Text-Image Articles. 
IXC-2.5 has been evaluated on 28\\nbenchmarks, outperforming existing open-source state-of-the-art models on 16\\nbenchmarks. It also surpasses or competes closely with GPT-4V and Gemini Pro on\\n16 key tasks. The InternLM-XComposer-2.5 is publicly available at\\nhttps://github.com/InternLM/InternLM-XComposer.'}, {'title': \"`Interaction annealing' to determine effective quantized valence and orbital structure: an illustration with ferro-orbital order in WTe$_2$\", 'authors': ['Ruoshi Jiang', 'Fangyuan Gu', 'Wei Ku'], 'published': '2024-07-03T17:59:18+00:00', 'updated': '2024-07-03T17:59:18+00:00', 'pdf_url': 'http://arxiv.org/pdf/2407.03319v1', 'entry_id': 'http://arxiv.org/abs/2407.03319v1', 'summary': \"Strongly correlated materials are known to display qualitatively distinct\\nemergent behaviors at low energy. Conveniently, the superposition principle of\\nquantum mechanics ensures that, upon absorbing quantum fluctuation, these rich\\nlow-energy behaviors can always be effectively described by dressed particles\\nwith fully quantized charge, spin, and orbitals structure. Such a powerful and\\nsimple description is, however, difficult to access through density functional\\ntheory (DFT) calculations, since in terms of bare particles the quantum\\nfluctuation would heavily smear the quantized quantities. To address this\\ndifficulty, we propose an `interaction annealing' approach to decipher the\\ndominant valence and orbital structure by suppressing the charge fluctuation\\nthrough enhancing ionic charging energy. Applying this approach to\\nferroelectric semi-metal WTe${_2}$ as a demonstration, we identify a dominant\\nferro-orbital ordered structure with W ion in a $d^2$ spin-0 configuration. 
The\\nproposed approach is straightforward to implement in standard DFT calculations\\nto grant additional access to essential low-energy physics.\"}, {'title': 'Fair Division of Indivisible Chores via Earning Restricted Equilibria', 'authors': ['Jugal Garg', 'Aniket Murhekar', 'John Qin'], 'published': '2024-07-03T17:58:22+00:00', 'updated': '2024-07-03T17:58:22+00:00', 'pdf_url': 'http://arxiv.org/pdf/2407.03318v1', 'entry_id': 'http://arxiv.org/abs/2407.03318v1', 'summary': \"We study fair division of $m$ indivisible chores among $n$ agents with\\nadditive preferences. We consider the desirable fairness notions of\\nenvy-freeness up to any chore (EFX) and envy-freeness up to $k$ chores (EF$k$),\\nalongside the efficiency notion of Pareto optimality (PO). We present the first\\nconstant approximations of these notions, showing the existence of:\\n - 5-EFX allocations, which improve the best-known factor of $O(n^2)$-EFX.\\n - 3-EFX and PO allocations for the special case of bivalued instances, which\\nimprove the best-known factor of $O(n)$-EFX without any efficiency guarantees.\\n - 2-EF2 + PO allocations, which improve the best-known factor of EF$m$ + PO.\\n A notable contribution of our work is the introduction of the novel concept\\nof earning-restricted (ER) competitive equilibrium for fractional allocations,\\nwhich limits agents' earnings from each chore. Technically, our work addresses\\ntwo main challenges: proving the existence of an ER equilibrium and designing\\nalgorithms that leverage ER equilibria to achieve the above results. 
To tackle\\nthe first challenge, we formulate a linear complementarity problem (LCP)\\nformulation that captures all ER equilibria and show that the classic\\ncomplementary pivot algorithm on the LCP must terminate at an ER equilibrium.\\nFor the second challenge, we carefully set the earning limits and use\\nproperties of ER equilibria to design sophisticated procedures that involve\\nswapping and merging bundles to meet the desired fairness and efficiency\\ncriteria. We expect that the concept of ER equilibrium will be instrumental in\\nderiving further results on related problems.\"}, {'title': 'Quantum Geometry Probed by Chiral Excitonic Optical Response of Chern Insulators', 'authors': ['Wen-Xuan Qiu', 'Fengcheng Wu'], 'published': '2024-07-03T17:58:11+00:00', 'updated': '2024-07-03T17:58:11+00:00', 'pdf_url': 'http://arxiv.org/pdf/2407.03317v1', 'entry_id': 'http://arxiv.org/abs/2407.03317v1', 'summary': 'We theoretically derive the sum rule for the negative first moment of the\\nabsorptive optical conductivity with excitonic effects and establish its\\nconnection to the quantum weight $K$ and Chern number $C$ of the ground state.\\nApplying this framework, we investigate the excitonic optical response of the\\nChern insulator at hole filling factor $\\\\nu=1$ in twisted bilayer MoTe$_2$. A\\nsingle chiral exciton state, which selectively absorbs circularly polarized\\nlight of a specific handedness, dominates the optical sum rule. The chiral\\nexciton state comprises two types of interlayer electron-hole transitions,\\nwhich cancel out the total out-of-plane dipole moment. The absorption spectrum\\nshows nearly perfect magnetic circular dichroism, which can be attributed to\\nthe nearly saturated bound $K \\\\ge |C|$ of the Chern insulator under study. 
Our\\nwork illustrates the potential of using excitonic optical responses to probe\\nquantum geometry encoded by $K$ and $C$.'}, {'title': 'An Upper Limit on the Photoproduction Cross Section of the Spin-Exotic $π_1(1600)$', 'authors': ['F. Afzal', 'C. S. Akondi', 'M. Albrecht', 'M. Amaryan', 'S. Arrigo', 'V. Arroyave', 'A. Asaturyan', 'A. Austregesilo', 'Z. Baldwin', 'F. Barbosa', 'J. Barlow', 'E. Barriga', 'R. Barsotti', 'D. Barton', 'V. Baturin', 'V. V. Berdnikov', 'T. Black', 'W. Boeglin', 'M. Boer', 'W. J. Briscoe', 'T. Britton', 'S. Cao', 'E. Chudakov', 'G. Chung', 'P. L. Cole', 'O. Cortes', 'V. Crede', 'M. M. Dalton', 'D. Darulis', 'A. Deur', 'S. Dobbs', 'A. Dolgolenko', 'M. Dugger', 'R. Dzhygadlo', 'D. Ebersole', 'M. Edo', 'H. Egiyan', 'T. Erbora', 'P. Eugenio', 'A. Fabrizi', 'C. Fanelli', 'S. Fang', 'J. Fitches', 'A. M. Foda', 'S. Furletov', 'L. Gan', 'H. Gao', 'A. Gardner', 'A. Gasparian', 'D. Glazier', 'C. Gleason', 'V. S. Goryachev', 'B. Grube', 'J. Guo', 'L. Guo', 'J. Hernandez', 'K. Hernandez', 'N. D. Hoffman', 'D. Hornidge', 'G. Hou', 'P. Hurck', 'A. Hurley', 'W. Imoehl', 'D. G. Ireland', 'M. M. Ito', 'I. Jaegle', 'N. S. Jarvis', 'T. Jeske', 'M. Jing', 'R. T. Jones', 'V. Kakoyan', 'G. Kalicy', 'V. Khachatryan', 'C. Kourkoumelis', 'A. LaDuke', 'I. Larin', 'D. Lawrence', 'D. I. Lersch', 'H. Li', 'B. Liu', 'K. Livingston', 'G. J. Lolos', 'L. Lorenti', 'V. Lyubovitskij', 'R. Ma', 'D. Mack', 'A. Mahmood', 'H. Marukyan', 'V. Matveev', 'M. McCaughan', 'M. McCracken', 'C. A. Meyer', 'R. Miskimen', 'R. E. Mitchell', 'K. Mizutani', 'V. Neelamana', 'L. Ng', 'E. Nissen', 'S. Orešić', 'A. I. Ostrovidov', 'Z. Papandreou', 'C. Paudel', 'R. Pedroni', 'L. Pentchev', 'K. J. Peters', 'E. Prather', 'S. Rakshit', 'J. Reinhold', 'A. Remington', 'B. G. Ritchie', 'J. Ritman', 'G. Rodriguez', 'D. Romanov', 'K. Saldana', 'C. Salgado', 'S. Schadmand', 'A. M. Schertz', 'K. Scheuer', 'A. Schick', 'A. Schmidt', 'R. A. Schumacher', 'J. Schwiening', 'N. Septian', 'P. Sharp', 'X. 
Shen', 'M. R. Shepherd', 'J. Sikes', 'A. Smith', 'E. S. Smith', 'D. I. Sober', 'A. Somov', 'S. Somov', 'J. R. Stevens', 'I. I. Strakovsky', 'B. Sumner', 'K. Suresh', 'V. V. Tarasov', 'S. Taylor', 'A. Teymurazyan', 'A. Thiel', 'T. Viducic', 'T. Whitlatch', 'N. Wickramaarachchi', 'Y. Wunderlich', 'B. Yu', 'J. Zarling', 'Z. Zhang', 'X. Zhou', 'B. Zihlmann'], 'published': '2024-07-03T17:57:15+00:00', 'updated': '2024-07-03T17:57:15+00:00', 'pdf_url': 'http://arxiv.org/pdf/2407.03316v1', 'entry_id': 'http://arxiv.org/abs/2407.03316v1', 'summary': \"The spin-exotic hybrid meson $\\\\pi_{1}(1600)$ is predicted to have a large\\ndecay rate to the $\\\\omega\\\\pi\\\\pi$ final state. Using 76.6~pb$^{-1}$ of data\\ncollected with the GlueX detector, we measure the cross sections for the\\nreactions $\\\\gamma p \\\\to \\\\omega \\\\pi^+ \\\\pi^- p$, $\\\\gamma p \\\\to \\\\omega \\\\pi^0 \\\\pi^0\\np$, and $\\\\gamma p\\\\to\\\\omega\\\\pi^-\\\\pi^0\\\\Delta^{++}$ in the range $E_\\\\gamma =$ 8-10\\nGeV. Using isospin conservation, we set the first upper limits on the\\nphotoproduction cross sections of the $\\\\pi^{0}_{1}(1600)$ and\\n$\\\\pi^{-}_{1}(1600)$. We combine these limits with lattice calculations of decay\\nwidths and find that photoproduction of $\\\\eta'\\\\pi$ is the most sensitive\\ntwo-body system to search for the $\\\\pi_1(1600)$.\"}, {'title': 'Quantum dynamical criticality speeds up thermodynamic entropy production', 'authors': ['Andesson B. Nascimento', 'Lucas C. Céleri'], 'published': '2024-07-03T17:57:00+00:00', 'updated': '2024-07-03T17:57:00+00:00', 'pdf_url': 'http://arxiv.org/pdf/2407.03315v1', 'entry_id': 'http://arxiv.org/abs/2407.03315v1', 'summary': 'The thermodynamics of quantum phase transitions has long been a rich area of\\nresearch, providing numerous insights and enhancing our understanding of this\\nimportant phenomenon. 
This theoretical framework has been well-developed\\nspecially because quantum phase transitions occur at equilibrium. However, its\\ndynamical counterpart, known as dynamical quantum phase transitions (DQPTs),\\ntakes place out-of-equilibrium, where conventional thermodynamic tools are\\ninapplicable. In this work, we make progress in this area by connecting\\ndynamical criticality to the second law of thermodynamics through a geometric\\nperspective on entropy production. Our findings, along with other recent\\ndevelopments, suggest that dynamical criticality can lead the system to highly\\ncomplex dynamics, indicating a possible pathway to thermalization.'}, {'title': 'BACON: Supercharge Your VLM with Bag-of-Concept Graph to Mitigate Hallucinations', 'authors': ['Zhantao Yang', 'Ruili Feng', 'Keyu Yan', 'Huangji Wang', 'Zhicai Wang', 'Shangwen Zhu', 'Han Zhang', 'Jie Xiao', 'Pingyu Wu', 'Kai Zhu', 'Jixuan Chen', 'Chen-Wei Xie', 'Chaojie Mao', 'Yue Yang', 'Hongyang Zhang', 'Yu Liu', 'Fan Cheng'], 'published': '2024-07-03T17:55:27+00:00', 'updated': '2024-07-03T17:55:27+00:00', 'pdf_url': 'http://arxiv.org/pdf/2407.03314v1', 'entry_id': 'http://arxiv.org/abs/2407.03314v1', 'summary': 'This paper presents Bag-of-Concept Graph (BACON) to gift models with limited\\nlinguistic abilities to taste the privilege of Vision Language Models (VLMs)\\nand boost downstream tasks such as detection, visual question answering (VQA),\\nand image generation. Since the visual scenes in physical worlds are structured\\nwith complex relations between objects, BACON breaks down annotations into\\nbasic minimum elements and presents them in a graph structure. Element-wise\\nstyle enables easy understanding, and structural composition liberates\\ndifficult locating. Careful prompt design births the BACON captions with the\\nhelp of public-available VLMs and segmentation methods. 
In this way, we gather\\na dataset with 100K annotated images, which endow VLMs with remarkable\\ncapabilities, such as accurately generating BACON, transforming prompts into\\nBACON format, envisioning scenarios in the style of BACONr, and dynamically\\nmodifying elements within BACON through interactive dialogue and more. Wide\\nrepresentative experiments, including detection, VQA, and image generation\\ntasks, tell BACON as a lifeline to achieve previous out-of-reach tasks or excel\\nin their current cutting-edge solutions.'}, {'title': 'Relative Polar Multiplicities, the Real Link, and Morse Inequalities for Hypersurfaces', 'authors': ['David B. Massey'], 'published': '2024-07-03T17:55:22+00:00', 'updated': '2024-07-03T17:55:22+00:00', 'pdf_url': 'http://arxiv.org/pdf/2407.03313v1', 'entry_id': 'http://arxiv.org/abs/2407.03313v1', 'summary': 'For a hypersurface defined by a complex analytic function, we derive\\nMorse-type inequalities between the Betti numbers of the real link of the\\nhypersurface and the relative polar multiplicities of the function.'}, {'title': 'Synthesizing data products, mathematical models, and observational measurements for lake temperature forecasting', 'authors': ['Maike F. Holthuijzen', 'Robert B. Gramacy', 'Cayelan C. Carey', 'Dave M. Higdon', 'R. Quinn Thomas'], 'published': '2024-07-03T17:54:57+00:00', 'updated': '2024-07-03T17:54:57+00:00', 'pdf_url': 'http://arxiv.org/pdf/2407.03312v1', 'entry_id': 'http://arxiv.org/abs/2407.03312v1', 'summary': 'We present a novel forecasting framework for lake water temperature profiles,\\ncrucial for managing lake ecosystems and drinking water resources. The General\\nLake Model (GLM), a one-dimensional process-based model, has been widely used\\nfor this purpose, but, similar to many process-based simulation models, it:\\nrequires a large number of input variables, many of which are stochastic;\\npresents challenges for uncertainty quantification (UQ); and can exhibit model\\nbias. 
To address these issues, we propose a Gaussian process (GP)\\nsurrogate-based forecasting approach that efficiently handles large,\\nhigh-dimensional data and accounts for input-dependent variability and\\nsystematic GLM bias. We validate the proposed approach and compare it with\\nother forecasting methods, including a climatological model and raw GLM\\nsimulations. Our results demonstrate that our bias-corrected GP surrogate\\n(GPBC) can outperform competing approaches in terms of forecast accuracy and UQ\\nup to two weeks into the future.'}]\n", "2024-07-06 09:04:12,480 - INFO - Starting ingestion of 10 documents\n" ] } ], "source": [ "result = run_ingestion_pipeline(query=\"System of Agents\", max_results=10)" ] }, { "cell_type": "code", "execution_count": 7, "metadata": {}, "outputs": [], "source": [ "import arxiv\n", "\n", "query = \"System of Agents\"\n", "max_results = 2\n", "\n", "client = arxiv.Client(page_size=max_results, delay_seconds=3, num_retries=3)\n", "search = arxiv.Search(query=query, max_results=max_results, sort_by=arxiv.SortCriterion.SubmittedDate)\n", "results = []\n", "\n", "client_results = client.results(search)" ] }, { "cell_type": "code", "execution_count": 11, "metadata": {}, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ "type(client_results): \n" ] } ], "source": [ "print(f\"type(client_results): {type(client_results)}\")" ] }, { "cell_type": "markdown", "metadata": {}, "source": [] }, { "cell_type": "code", "execution_count": 12, "metadata": {}, "outputs": [ { "name": "stderr", "output_type": "stream", "text": [ "2024-07-06 09:48:09,300 - INFO - Requesting page (first: True, try: 0): https://export.arxiv.org/api/query?search_query=System+of+Agents&id_list=&sortBy=submittedDate&sortOrder=descending&start=0&max_results=2\n", "2024-07-06 09:48:10,487 - INFO - Got first page: 2 of 2492622 total results\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "\n", "Title: Planetarium: A Rigorous Benchmark for 
Translating Text to Structured Planning Languages\n", "Authors: ['Max Zuo', 'Francisco Piedrahita Velez', 'Xiaochen Li', 'Michael L. Littman', 'Stephen H. Bach']\n", "Published: 2024-07-03 17:59:53+00:00\n", "Summary: Many recent works have explored using language models for planning problems.\n", "One line of research focuses on translating natural language descriptions of\n", "planning tasks into structured planning languages, such as the planning domain\n", "definition language (PDDL). While this approach is promising, accurately\n", "measuring the quality of generated PDDL code continues to pose significant\n", "challenges. First, generated PDDL code is typically evaluated using planning\n", "validators that check whether the problem can be solved with a planner. This\n", "method is insufficient because a language model might generate valid PDDL code\n", "that does not align with the natural language description of the task. Second,\n", "existing evaluation sets often have natural language descriptions of the\n", "planning task that closely resemble the ground truth PDDL, reducing the\n", "challenge of the task. To bridge this gap, we introduce \\benchmarkName, a\n", "benchmark designed to evaluate language models' ability to generate PDDL code\n", "from natural language descriptions of planning tasks. We begin by creating a\n", "PDDL equivalence algorithm that rigorously evaluates the correctness of PDDL\n", "code generated by language models by flexibly comparing it against a ground\n", "truth PDDL. Then, we present a dataset of $132,037$ text-to-PDDL pairs across\n", "13 different tasks, with varying levels of difficulty. Finally, we evaluate\n", "several API-access and open-weight language models that reveal this task's\n", "complexity. 
For example, $87.6\\%$ of the PDDL problem descriptions generated by\n", "GPT-4o are syntactically parseable, $82.2\\%$ are valid, solve-able problems,\n", "but only $35.1\\%$ are semantically correct, highlighting the need for a more\n", "rigorous benchmark for this problem.\n", "\n", "Title: InternLM-XComposer-2.5: A Versatile Large Vision Language Model Supporting Long-Contextual Input and Output\n", "Authors: ['Pan Zhang', 'Xiaoyi Dong', 'Yuhang Zang', 'Yuhang Cao', 'Rui Qian', 'Lin Chen', 'Qipeng Guo', 'Haodong Duan', 'Bin Wang', 'Linke Ouyang', 'Songyang Zhang', 'Wenwei Zhang', 'Yining Li', 'Yang Gao', 'Peng Sun', 'Xinyue Zhang', 'Wei Li', 'Jingwen Li', 'Wenhai Wang', 'Hang Yan', 'Conghui He', 'Xingcheng Zhang', 'Kai Chen', 'Jifeng Dai', 'Yu Qiao', 'Dahua Lin', 'Jiaqi Wang']\n", "Published: 2024-07-03 17:59:21+00:00\n", "Summary: We present InternLM-XComposer-2.5 (IXC-2.5), a versatile large-vision\n", "language model that supports long-contextual input and output. IXC-2.5 excels\n", "in various text-image comprehension and composition applications, achieving\n", "GPT-4V level capabilities with merely 7B LLM backend. Trained with 24K\n", "interleaved image-text contexts, it can seamlessly extend to 96K long contexts\n", "via RoPE extrapolation. This long-context capability allows IXC-2.5 to excel in\n", "tasks requiring extensive input and output contexts. Compared to its previous\n", "2.0 version, InternLM-XComposer-2.5 features three major upgrades in\n", "vision-language comprehension: (1) Ultra-High Resolution Understanding, (2)\n", "Fine-Grained Video Understanding, and (3) Multi-Turn Multi-Image Dialogue. In\n", "addition to comprehension, IXC-2.5 extends to two compelling applications using\n", "extra LoRA parameters for text-image composition: (1) Crafting Webpages and (2)\n", "Composing High-Quality Text-Image Articles. IXC-2.5 has been evaluated on 28\n", "benchmarks, outperforming existing open-source state-of-the-art models on 16\n", "benchmarks. 
It also surpasses or competes closely with GPT-4V and Gemini Pro on\n", "16 key tasks. The InternLM-XComposer-2.5 is publicly available at\n", "https://github.com/InternLM/InternLM-XComposer.\n", "\n" ] } ], "source": [ "import arxiv\n", "import logging\n", "\n", "# Configure logging\n", "logging.basicConfig(level=logging.INFO, format='%(asctime)s - %(levelname)s - %(message)s')\n", "\n", "query = \"System of Agents\"\n", "max_results = 2\n", "\n", "client = arxiv.Client(page_size=max_results, delay_seconds=3, num_retries=3)\n", "search = arxiv.Search(query=query, max_results=max_results, sort_by=arxiv.SortCriterion.SubmittedDate)\n", "client_results = client.results(search)\n", "\n", "# Convert client_results to a list\n", "results_list = list(client_results)\n", "\n", "# Check the type of results_list\n", "print(type(results_list))\n", "\n", "# Process each result\n", "for result in results_list:\n", " print(f\"Title: {result.title}\")\n", " print(f\"Authors: {[author.name for author in result.authors]}\")\n", " print(f\"Published: {result.published}\")\n", " print(f\"Summary: {result.summary}\\n\")\n" ] }, { "cell_type": "code", "execution_count": 15, "metadata": {}, "outputs": [ { "name": "stderr", "output_type": "stream", "text": [ "2024-07-06 09:52:09,664 - INFO - Requesting page (first: True, try: 0): https://export.arxiv.org/api/query?search_query=System+of+Agents&id_list=&sortBy=submittedDate&sortOrder=descending&start=0&max_results=10\n", "2024-07-06 09:52:10,994 - INFO - Got first page: 10 of 2492622 total results\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Entry_id: http://arxiv.org/abs/2407.03321v1\n", "Updated: 2024-07-03 17:59:53+00:00\n", "Published: 2024-07-03 17:59:53+00:00\n", "Title: Planetarium: A Rigorous Benchmark for Translating Text to Structured Planning Languages\n", "Authors: [arxiv.Result.Author('Max Zuo'), arxiv.Result.Author('Francisco Piedrahita Velez'), arxiv.Result.Author('Xiaochen Li'), 
arxiv.Result.Author('Michael L. Littman'), arxiv.Result.Author('Stephen H. Bach')]\n", "Comment: None\n", "Journal_ref: None\n", "Doi: None\n", "Primary_category: cs.CL\n", "Categories: ['cs.CL', 'cs.AI', 'cs.LG']\n", "Links: [arxiv.Result.Link('http://arxiv.org/abs/2407.03321v1', title=None, rel='alternate', content_type=None), arxiv.Result.Link('http://arxiv.org/pdf/2407.03321v1', title='pdf', rel='related', content_type=None)]\n", "Pdf_url: http://arxiv.org/pdf/2407.03321v1\n", "\n", "--------------------------------------------------------------------------------\n", "\n", "Entry_id: http://arxiv.org/abs/2407.03320v1\n", "Updated: 2024-07-03 17:59:21+00:00\n", "Published: 2024-07-03 17:59:21+00:00\n", "Title: InternLM-XComposer-2.5: A Versatile Large Vision Language Model Supporting Long-Contextual Input and Output\n", "Authors: [arxiv.Result.Author('Pan Zhang'), arxiv.Result.Author('Xiaoyi Dong'), arxiv.Result.Author('Yuhang Zang'), arxiv.Result.Author('Yuhang Cao'), arxiv.Result.Author('Rui Qian'), arxiv.Result.Author('Lin Chen'), arxiv.Result.Author('Qipeng Guo'), arxiv.Result.Author('Haodong Duan'), arxiv.Result.Author('Bin Wang'), arxiv.Result.Author('Linke Ouyang'), arxiv.Result.Author('Songyang Zhang'), arxiv.Result.Author('Wenwei Zhang'), arxiv.Result.Author('Yining Li'), arxiv.Result.Author('Yang Gao'), arxiv.Result.Author('Peng Sun'), arxiv.Result.Author('Xinyue Zhang'), arxiv.Result.Author('Wei Li'), arxiv.Result.Author('Jingwen Li'), arxiv.Result.Author('Wenhai Wang'), arxiv.Result.Author('Hang Yan'), arxiv.Result.Author('Conghui He'), arxiv.Result.Author('Xingcheng Zhang'), arxiv.Result.Author('Kai Chen'), arxiv.Result.Author('Jifeng Dai'), arxiv.Result.Author('Yu Qiao'), arxiv.Result.Author('Dahua Lin'), arxiv.Result.Author('Jiaqi Wang')]\n", "Comment: Technical Report. 
https://github.com/InternLM/InternLM-XComposer\n", "Journal_ref: None\n", "Doi: None\n", "Primary_category: cs.CV\n", "Categories: ['cs.CV', 'cs.CL']\n", "Links: [arxiv.Result.Link('http://arxiv.org/abs/2407.03320v1', title=None, rel='alternate', content_type=None), arxiv.Result.Link('http://arxiv.org/pdf/2407.03320v1', title='pdf', rel='related', content_type=None)]\n", "Pdf_url: http://arxiv.org/pdf/2407.03320v1\n", "\n", "--------------------------------------------------------------------------------\n", "\n", "Entry_id: http://arxiv.org/abs/2407.03319v1\n", "Updated: 2024-07-03 17:59:18+00:00\n", "Published: 2024-07-03 17:59:18+00:00\n", "Title: `Interaction annealing' to determine effective quantized valence and orbital structure: an illustration with ferro-orbital order in WTe$_2$\n", "Authors: [arxiv.Result.Author('Ruoshi Jiang'), arxiv.Result.Author('Fangyuan Gu'), arxiv.Result.Author('Wei Ku')]\n", "Comment: 6 pages, 3 figures\n", "Journal_ref: None\n", "Doi: None\n", "Primary_category: cond-mat.str-el\n", "Categories: ['cond-mat.str-el', 'cond-mat.mtrl-sci', 'physics.comp-ph']\n", "Links: [arxiv.Result.Link('http://arxiv.org/abs/2407.03319v1', title=None, rel='alternate', content_type=None), arxiv.Result.Link('http://arxiv.org/pdf/2407.03319v1', title='pdf', rel='related', content_type=None)]\n", "Pdf_url: http://arxiv.org/pdf/2407.03319v1\n", "\n", "--------------------------------------------------------------------------------\n", "\n", "Entry_id: http://arxiv.org/abs/2407.03318v1\n", "Updated: 2024-07-03 17:58:22+00:00\n", "Published: 2024-07-03 17:58:22+00:00\n", "Title: Fair Division of Indivisible Chores via Earning Restricted Equilibria\n", "Authors: [arxiv.Result.Author('Jugal Garg'), arxiv.Result.Author('Aniket Murhekar'), arxiv.Result.Author('John Qin')]\n", "Comment: 54 pages\n", "Journal_ref: None\n", "Doi: None\n", "Primary_category: cs.GT\n", "Categories: ['cs.GT']\n", "Links: [arxiv.Result.Link('http://arxiv.org/abs/2407.03318v1', 
title=None, rel='alternate', content_type=None), arxiv.Result.Link('http://arxiv.org/pdf/2407.03318v1', title='pdf', rel='related', content_type=None)]\n", "Pdf_url: http://arxiv.org/pdf/2407.03318v1\n", "\n", "--------------------------------------------------------------------------------\n", "\n", "Entry_id: http://arxiv.org/abs/2407.03317v1\n", "Updated: 2024-07-03 17:58:11+00:00\n", "Published: 2024-07-03 17:58:11+00:00\n", "Title: Quantum Geometry Probed by Chiral Excitonic Optical Response of Chern Insulators\n", "Authors: [arxiv.Result.Author('Wen-Xuan Qiu'), arxiv.Result.Author('Fengcheng Wu')]\n", "Comment: 6+5 pages,4+2 figures\n", "Journal_ref: None\n", "Doi: None\n", "Primary_category: cond-mat.mes-hall\n", "Categories: ['cond-mat.mes-hall', 'cond-mat.mtrl-sci', 'cond-mat.str-el']\n", "Links: [arxiv.Result.Link('http://arxiv.org/abs/2407.03317v1', title=None, rel='alternate', content_type=None), arxiv.Result.Link('http://arxiv.org/pdf/2407.03317v1', title='pdf', rel='related', content_type=None)]\n", "Pdf_url: http://arxiv.org/pdf/2407.03317v1\n", "\n", "--------------------------------------------------------------------------------\n", "\n", "Entry_id: http://arxiv.org/abs/2407.03316v1\n", "Updated: 2024-07-03 17:57:15+00:00\n", "Published: 2024-07-03 17:57:15+00:00\n", "Title: An Upper Limit on the Photoproduction Cross Section of the Spin-Exotic $π_1(1600)$\n", "Authors: [arxiv.Result.Author('F. Afzal'), arxiv.Result.Author('C. S. Akondi'), arxiv.Result.Author('M. Albrecht'), arxiv.Result.Author('M. Amaryan'), arxiv.Result.Author('S. Arrigo'), arxiv.Result.Author('V. Arroyave'), arxiv.Result.Author('A. Asaturyan'), arxiv.Result.Author('A. Austregesilo'), arxiv.Result.Author('Z. Baldwin'), arxiv.Result.Author('F. Barbosa'), arxiv.Result.Author('J. Barlow'), arxiv.Result.Author('E. Barriga'), arxiv.Result.Author('R. Barsotti'), arxiv.Result.Author('D. Barton'), arxiv.Result.Author('V. Baturin'), arxiv.Result.Author('V. V. 
Berdnikov'), arxiv.Result.Author('T. Black'), arxiv.Result.Author('W. Boeglin'), arxiv.Result.Author('M. Boer'), arxiv.Result.Author('W. J. Briscoe'), arxiv.Result.Author('T. Britton'), arxiv.Result.Author('S. Cao'), arxiv.Result.Author('E. Chudakov'), arxiv.Result.Author('G. Chung'), arxiv.Result.Author('P. L. Cole'), arxiv.Result.Author('O. Cortes'), arxiv.Result.Author('V. Crede'), arxiv.Result.Author('M. M. Dalton'), arxiv.Result.Author('D. Darulis'), arxiv.Result.Author('A. Deur'), arxiv.Result.Author('S. Dobbs'), arxiv.Result.Author('A. Dolgolenko'), arxiv.Result.Author('M. Dugger'), arxiv.Result.Author('R. Dzhygadlo'), arxiv.Result.Author('D. Ebersole'), arxiv.Result.Author('M. Edo'), arxiv.Result.Author('H. Egiyan'), arxiv.Result.Author('T. Erbora'), arxiv.Result.Author('P. Eugenio'), arxiv.Result.Author('A. Fabrizi'), arxiv.Result.Author('C. Fanelli'), arxiv.Result.Author('S. Fang'), arxiv.Result.Author('J. Fitches'), arxiv.Result.Author('A. M. Foda'), arxiv.Result.Author('S. Furletov'), arxiv.Result.Author('L. Gan'), arxiv.Result.Author('H. Gao'), arxiv.Result.Author('A. Gardner'), arxiv.Result.Author('A. Gasparian'), arxiv.Result.Author('D. Glazier'), arxiv.Result.Author('C. Gleason'), arxiv.Result.Author('V. S. Goryachev'), arxiv.Result.Author('B. Grube'), arxiv.Result.Author('J. Guo'), arxiv.Result.Author('L. Guo'), arxiv.Result.Author('J. Hernandez'), arxiv.Result.Author('K. Hernandez'), arxiv.Result.Author('N. D. Hoffman'), arxiv.Result.Author('D. Hornidge'), arxiv.Result.Author('G. Hou'), arxiv.Result.Author('P. Hurck'), arxiv.Result.Author('A. Hurley'), arxiv.Result.Author('W. Imoehl'), arxiv.Result.Author('D. G. Ireland'), arxiv.Result.Author('M. M. Ito'), arxiv.Result.Author('I. Jaegle'), arxiv.Result.Author('N. S. Jarvis'), arxiv.Result.Author('T. Jeske'), arxiv.Result.Author('M. Jing'), arxiv.Result.Author('R. T. Jones'), arxiv.Result.Author('V. Kakoyan'), arxiv.Result.Author('G. Kalicy'), arxiv.Result.Author('V. 
Khachatryan'), arxiv.Result.Author('C. Kourkoumelis'), arxiv.Result.Author('A. LaDuke'), arxiv.Result.Author('I. Larin'), arxiv.Result.Author('D. Lawrence'), arxiv.Result.Author('D. I. Lersch'), arxiv.Result.Author('H. Li'), arxiv.Result.Author('B. Liu'), arxiv.Result.Author('K. Livingston'), arxiv.Result.Author('G. J. Lolos'), arxiv.Result.Author('L. Lorenti'), arxiv.Result.Author('V. Lyubovitskij'), arxiv.Result.Author('R. Ma'), arxiv.Result.Author('D. Mack'), arxiv.Result.Author('A. Mahmood'), arxiv.Result.Author('H. Marukyan'), arxiv.Result.Author('V. Matveev'), arxiv.Result.Author('M. McCaughan'), arxiv.Result.Author('M. McCracken'), arxiv.Result.Author('C. A. Meyer'), arxiv.Result.Author('R. Miskimen'), arxiv.Result.Author('R. E. Mitchell'), arxiv.Result.Author('K. Mizutani'), arxiv.Result.Author('V. Neelamana'), arxiv.Result.Author('L. Ng'), arxiv.Result.Author('E. Nissen'), arxiv.Result.Author('S. Orešić'), arxiv.Result.Author('A. I. Ostrovidov'), arxiv.Result.Author('Z. Papandreou'), arxiv.Result.Author('C. Paudel'), arxiv.Result.Author('R. Pedroni'), arxiv.Result.Author('L. Pentchev'), arxiv.Result.Author('K. J. Peters'), arxiv.Result.Author('E. Prather'), arxiv.Result.Author('S. Rakshit'), arxiv.Result.Author('J. Reinhold'), arxiv.Result.Author('A. Remington'), arxiv.Result.Author('B. G. Ritchie'), arxiv.Result.Author('J. Ritman'), arxiv.Result.Author('G. Rodriguez'), arxiv.Result.Author('D. Romanov'), arxiv.Result.Author('K. Saldana'), arxiv.Result.Author('C. Salgado'), arxiv.Result.Author('S. Schadmand'), arxiv.Result.Author('A. M. Schertz'), arxiv.Result.Author('K. Scheuer'), arxiv.Result.Author('A. Schick'), arxiv.Result.Author('A. Schmidt'), arxiv.Result.Author('R. A. Schumacher'), arxiv.Result.Author('J. Schwiening'), arxiv.Result.Author('N. Septian'), arxiv.Result.Author('P. Sharp'), arxiv.Result.Author('X. Shen'), arxiv.Result.Author('M. R. Shepherd'), arxiv.Result.Author('J. Sikes'), arxiv.Result.Author('A. Smith'), arxiv.Result.Author('E. S. 
Smith'), arxiv.Result.Author('D. I. Sober'), arxiv.Result.Author('A. Somov'), arxiv.Result.Author('S. Somov'), arxiv.Result.Author('J. R. Stevens'), arxiv.Result.Author('I. I. Strakovsky'), arxiv.Result.Author('B. Sumner'), arxiv.Result.Author('K. Suresh'), arxiv.Result.Author('V. V. Tarasov'), arxiv.Result.Author('S. Taylor'), arxiv.Result.Author('A. Teymurazyan'), arxiv.Result.Author('A. Thiel'), arxiv.Result.Author('T. Viducic'), arxiv.Result.Author('T. Whitlatch'), arxiv.Result.Author('N. Wickramaarachchi'), arxiv.Result.Author('Y. Wunderlich'), arxiv.Result.Author('B. Yu'), arxiv.Result.Author('J. Zarling'), arxiv.Result.Author('Z. Zhang'), arxiv.Result.Author('X. Zhou'), arxiv.Result.Author('B. Zihlmann')]\n", "Comment: 6 pages, 3 figures plus supplemental materials\n", "Journal_ref: None\n", "Doi: None\n", "Primary_category: nucl-ex\n", "Categories: ['nucl-ex', 'hep-ex']\n", "Links: [arxiv.Result.Link('http://arxiv.org/abs/2407.03316v1', title=None, rel='alternate', content_type=None), arxiv.Result.Link('http://arxiv.org/pdf/2407.03316v1', title='pdf', rel='related', content_type=None)]\n", "Pdf_url: http://arxiv.org/pdf/2407.03316v1\n", "\n", "--------------------------------------------------------------------------------\n", "\n", "Entry_id: http://arxiv.org/abs/2407.03315v1\n", "Updated: 2024-07-03 17:57:00+00:00\n", "Published: 2024-07-03 17:57:00+00:00\n", "Title: Quantum dynamical criticality speeds up thermodynamic entropy production\n", "Authors: [arxiv.Result.Author('Andesson B. Nascimento'), arxiv.Result.Author('Lucas C. 
Céleri')]\n", "Comment: 8 pages, 8 figures\n", "Journal_ref: None\n", "Doi: None\n", "Primary_category: quant-ph\n", "Categories: ['quant-ph']\n", "Links: [arxiv.Result.Link('http://arxiv.org/abs/2407.03315v1', title=None, rel='alternate', content_type=None), arxiv.Result.Link('http://arxiv.org/pdf/2407.03315v1', title='pdf', rel='related', content_type=None)]\n", "Pdf_url: http://arxiv.org/pdf/2407.03315v1\n", "\n", "--------------------------------------------------------------------------------\n", "\n", "Entry_id: http://arxiv.org/abs/2407.03314v1\n", "Updated: 2024-07-03 17:55:27+00:00\n", "Published: 2024-07-03 17:55:27+00:00\n", "Title: BACON: Supercharge Your VLM with Bag-of-Concept Graph to Mitigate Hallucinations\n", "Authors: [arxiv.Result.Author('Zhantao Yang'), arxiv.Result.Author('Ruili Feng'), arxiv.Result.Author('Keyu Yan'), arxiv.Result.Author('Huangji Wang'), arxiv.Result.Author('Zhicai Wang'), arxiv.Result.Author('Shangwen Zhu'), arxiv.Result.Author('Han Zhang'), arxiv.Result.Author('Jie Xiao'), arxiv.Result.Author('Pingyu Wu'), arxiv.Result.Author('Kai Zhu'), arxiv.Result.Author('Jixuan Chen'), arxiv.Result.Author('Chen-Wei Xie'), arxiv.Result.Author('Chaojie Mao'), arxiv.Result.Author('Yue Yang'), arxiv.Result.Author('Hongyang Zhang'), arxiv.Result.Author('Yu Liu'), arxiv.Result.Author('Fan Cheng')]\n", "Comment: None\n", "Journal_ref: None\n", "Doi: None\n", "Primary_category: cs.CV\n", "Categories: ['cs.CV', 'cs.CL', 'cs.DB']\n", "Links: [arxiv.Result.Link('http://arxiv.org/abs/2407.03314v1', title=None, rel='alternate', content_type=None), arxiv.Result.Link('http://arxiv.org/pdf/2407.03314v1', title='pdf', rel='related', content_type=None)]\n", "Pdf_url: http://arxiv.org/pdf/2407.03314v1\n", "\n", "--------------------------------------------------------------------------------\n", "\n", "Entry_id: http://arxiv.org/abs/2407.03313v1\n", "Updated: 2024-07-03 17:55:22+00:00\n", "Published: 2024-07-03 17:55:22+00:00\n", "Title: Relative Polar 
Multiplicities, the Real Link, and Morse Inequalities for Hypersurfaces\n", "Authors: [arxiv.Result.Author('David B. Massey')]\n", "Comment: 4 pages\n", "Journal_ref: None\n", "Doi: None\n", "Primary_category: math.AG\n", "Categories: ['math.AG']\n", "Links: [arxiv.Result.Link('http://arxiv.org/abs/2407.03313v1', title=None, rel='alternate', content_type=None), arxiv.Result.Link('http://arxiv.org/pdf/2407.03313v1', title='pdf', rel='related', content_type=None)]\n", "Pdf_url: http://arxiv.org/pdf/2407.03313v1\n", "\n", "--------------------------------------------------------------------------------\n", "\n", "Entry_id: http://arxiv.org/abs/2407.03312v1\n", "Updated: 2024-07-03 17:54:57+00:00\n", "Published: 2024-07-03 17:54:57+00:00\n", "Title: Synthesizing data products, mathematical models, and observational measurements for lake temperature forecasting\n", "Authors: [arxiv.Result.Author('Maike F. Holthuijzen'), arxiv.Result.Author('Robert B. Gramacy'), arxiv.Result.Author('Cayelan C. Carey'), arxiv.Result.Author('Dave M. Higdon'), arxiv.Result.Author('R. 
Quinn Thomas')]\n", "Comment: 34 pages, 17 figures\n", "Journal_ref: None\n", "Doi: None\n", "Primary_category: stat.AP\n", "Categories: ['stat.AP', 'G.3; J.2']\n", "Links: [arxiv.Result.Link('http://arxiv.org/abs/2407.03312v1', title=None, rel='alternate', content_type=None), arxiv.Result.Link('http://arxiv.org/pdf/2407.03312v1', title='pdf', rel='related', content_type=None)]\n", "Pdf_url: http://arxiv.org/pdf/2407.03312v1\n", "\n", "--------------------------------------------------------------------------------\n", "\n" ] } ], "source": [
 "import arxiv\n",
 "import logging\n",
 "\n",
 "# Root logger: INFO level, timestamped \"time - level - message\" records\n",
 "logging.basicConfig(level=logging.INFO, format='%(asctime)s - %(levelname)s - %(message)s')\n",
 "\n",
 "# Search parameters\n",
 "query = \"System of Agents\"\n",
 "max_results = 10\n",
 "\n",
 "# Attributes of each result that are left out of the printout\n",
 "exclude_fields = ['summary', '_raw']\n",
 "\n",
 "# One page sized to the requested count, newest submissions first\n",
 "client = arxiv.Client(page_size=max_results, delay_seconds=3, num_retries=3)\n",
 "search = arxiv.Search(query=query, max_results=max_results, sort_by=arxiv.SortCriterion.SubmittedDate)\n",
 "\n",
 "# Materialise the results into a list so they can be walked below\n",
 "client_results = client.results(search)\n",
 "results_list = [*client_results]\n",
 "\n",
 "# For every paper: one \"Name: value\" line per retained attribute, then a dashed rule\n",
 "for result in results_list:\n",
 "    result_dict = vars(result)\n",
 "    shown = [(key, value) for key, value in result_dict.items() if key not in exclude_fields]\n",
 "    for key, value in shown:\n",
 "        print(f\"{key.capitalize()}: {value}\")\n",
 "    print(\"\\n\" + \"-\"*80 + \"\\n\")\n"
 ] }, { "cell_type": "code", "execution_count": null, "metadata": {}, "outputs": [], "source": [] } ], "metadata": { "kernelspec": { "display_name": ".venv", "language": "python", "name": "python3" }, "language_info": { "codemirror_mode": { "name": "ipython", "version": 3 }, "file_extension": ".py", "mimetype": "text/x-python", "name": "python", "nbconvert_exporter": "python", "pygments_lexer": "ipython3", "version": "3.10.13" } }, "nbformat": 4, "nbformat_minor": 2 }