From 595a66b8361d6a240aafa6bb4450f0133b6a7a96 Mon Sep 17 00:00:00 2001 From: Shagun Sodhani Date: Sun, 12 Feb 2023 13:52:02 -0500 Subject: [PATCH] Add toolformer paper --- 404.html | 2 +- ...-Model-for-Natural-Language-Inference.html | 8 +- ...pendency-Parser-using-Neural-Networks.html | 8 +- A-Foliated-View-of-Transfer-Learning.html | 8 +- ...Deep-Learning-with-Symbolic-Knowledge.html | 8 +- ...-Learning-of-Language-Representations.html | 8 +- Abductive-Commonsense-Reasoning.html | 8 +- ...batch-SGD-Training-ImageNet-in-1-Hour.html | 8 +- ...k-Prediction-a-View-from-the-Trenches.html | 8 +- ...-with-Composition-in-Classifier-Space.html | 8 +- ...ing-in-Gradient-Based-Neural-Networks.html | 8 +- ...en-Representations-and-Task-Semantics.html | 8 +- ...works-for-Natural-Language-Processing.html | 8 +- ...zation-in-Deep-Reinforcement-Learning.html | 8 +- ...ider-Optima-and-Better-Generalization.html | 8 +- ...age-Learning-With-a-Human-In-the-Loop.html | 8 +- Born-Again-Neural-Networks.html | 8 +- ...ears-later-How-the-rules-have-changed.html | 8 +- ...sentations-for-Reinforcement-Learning.html | 8 +- ...centralized-structured-storage-system.html | 8 +- ...of-Independent-Deep-Generative-Models.html | 8 +- Compositional-Explanations-of-Neurons.html | 8 +- Conditional-Similarity-Networks.html | 8 +- ...rn-Distributed-Database-System-Design.html | 8 +- Continual-learning-with-hypernetworks.html | 8 +- ...e-Learning-of-Structured-World-Models.html | 8 +- ...ng-Rates-for-Training-Neural-Networks.html | 8 +- ...ent-for-Internet-Scale-Single-Sign-On.html | 8 +- ...aking-via-Local-Economic-Transactions.html | 8 +- ...-Networks-for-YouTube-Recommendations.html | 8 +- ...rcement-Learning-and-the-Deadly-Triad.html | 8 +- ...s-using-Probabilistic-Dynamics-Models.html | 8 +- ...r-container-based-distributed-systems.html | 8 +- ...ing-the-Knowledge-in-a-Neural-Network.html | 8 +- ...ning-Skills-without-a-Reward-Function.html | 8 +- ...Discriminators-Rather-Than-Generators.html | 8 
+- Efficient-Lifelong-Learning-with-A-GEM.html | 8 +- ...l-Language-in-Multi-Agent-Populations.html | 8 +- ...ion-with-Internal-and-External-Memory.html | 8 +- ...y-based-Models-for-Continual-Learning.html | 8 +- ...Purpose-of-Actions-in-Procedural-Text.html | 8 +- ...and-Data-for-Image-Question-Answering.html | 8 +- ...imple-Siamese-Representation-Learning.html | 8 +- ...nforcement-Learning-from-Observations.html | 8 +- ...-Explanation-of-Graph-Neural-Networks.html | 8 +- ...with-Micro-Batch-Pipeline-Parallelism.html | 8 +- ...ation-with-Pointer-Generator-Networks.html | 8 +- ...nough-Compositional-Data-Augmentation.html | 8 +- ...tor-Learner-Architectures-for-Deep-RL.html | 8 +- ...-Balancing-in-Deep-Multitask-Networks.html | 8 +- Gradient-Surgery-for-Multi-Task-Learning.html | 8 +- ...lection-for-online-continual-learning.html | 8 +- ...-Representation-Learning-for-Networks.html | 8 +- Hamiltonian-Neural-Networks.html | 8 +- ...-Yield,-and-Scalable-Tolerant-Systems.html | 8 +- ...-Learning-with-Differentiable-Pooling.html | 8 +- ...e-of-Proprioceptive-Periodic-Policies.html | 8 +- ...rder-organization-of-complex-networks.html | 8 +- Hindsight-Experience-Replay.html | 8 +- HoME-a-Household-Multimodal-Environment.html | 8 +- How-to-train-your-MAML.html | 8 +- ...-are-features-in-deep-neural-networks.html | 8 +- HyperNetworks.html | 8 +- ...gents-for-Deep-Reinforcement-Learning.html | 8 +- ...-Evidence-with-Reinforcement-Learning.html | 8 +- Kronecker-Recurrent-Units.html | 8 +- Large-Memory-Layers-with-Product-Keys.html | 8 +- ...-Optimizers-that-Scale-and-Generalize.html | 8 +- ...ng-Explanations-That-Are-Hard-To-Vary.html | 8 +- Learning-Independent-Causal-Mechanisms.html | 8 +- ...AT-Solver-from-Single-Bit-Supervision.html | 8 +- ...to-Compute-Word-Embeddings-On-the-Fly.html | 8 +- ...-Images-for-Visual-Question-Answering.html | 8 +- ...-Memory-for-Recurrent-Neural-Networks.html | 8 +- ...cene-Decomposition-and-Representation.html | 8 +- 
...standing-in-Visual-Question-Answering.html | 8 +- ...n-in-the-Wild-Findings-and-Challenges.html | 8 +- ...hogi-by-Planning-with-a-Learned-Model.html | 8 +- ...Abstract-Reasoning-in-Neural-Networks.html | 8 +- Memory-Based-Parameter-Adaption.html | 8 +- ...-Unsupervised-Representation-Learning.html | 8 +- ...-of-Structured-Exploration-Strategies.html | 8 +- ...hical-Lifelong-Reinforcement-Learning.html | 8 +- Modular-meta-learning.html | 8 +- ...le-Model-Based-Reinforcement-Learning.html | 8 +- ...ating-Learning-via-Knowledge-Transfer.html | 8 +- ...e-Building-Blocks-of-Complex-Networks.html | 8 +- ...zation-in-Deep-Reinforcement-Learning.html | 8 +- ...Message-Passing-for-Quantum-Chemistry.html | 8 +- Neural-Module-Networks.html | 8 +- ...nal-Inference-for-Interacting-Systems.html | 8 +- ...Overfitting-in-Reinforcement-Learning.html | 8 +- ...Warm-Starting-Neural-Network-Training.html | 8 +- One-Model-To-Learn-Them-All.html | 8 +- ...xtrapolation-via-Structured-MaxEnt-RL.html | 8 +- ...with-Memory-Augmented-Neural-Networks.html | 8 +- ...arsely-Gated-Mixture-of-Experts-Layer.html | 8 +- ...-New-Benchmark-for-Physical-Reasoning.html | 8 +- ...rge-scale-Heterogeneous-Text-Networks.html | 8 +- ...Learning-Hierarchical-Representations.html | 8 +- Pointer-Networks.html | 8 +- ...-Predicting-Clicks-on-Ads-at-Facebook.html | 8 +- ...ng-Graph-Neural-Networks-with-Kernels.html | 8 +- ...tribution-Examples-in-Neural-Networks.html | 8 +- ...eralization-in-Reinforcement-Learning.html | 8 +- ...rehension-with-Self-matching-Networks.html | 8 +- ...derstanding-the-Effectiveness-of-MAML.html | 8 +- ...pedia-to-Answer-Open-Domain-Questions.html | 8 +- ...Stop-Reading-in-Machine-Comprehension.html | 8 +- ...tworks-for-Neural-Machine-Translation.html | 8 +- Relational-Reinforcement-Learning.html | 8 +- ...ations-Reduce-Catastrophic-Forgetting.html | 8 +- ...n-Tradeoffs-for-Hyperbolic-Embeddings.html | 8 +- ...ing-Fundamentals-of-Experience-Replay.html | 8 +- 
...rvised-Learning-with-Graph-Embeddings.html | 8 +- ...ces-Managing-Technical-Debt-at-Google.html | 8 +- ...Permutation-Invariant-Neural-Networks.html | 8 +- ...aseline-for-Visual-Question-Answering.html | 8 +- ...nctions-for-Deep-Top-k-Classification.html | 8 +- StarSpace-Embed-All-The-Things.html | 8 +- ...stems-Using-Recurrent-Neural-Networks.html | 8 +- Superposition-of-many-models-into-one.html | 8 +- Supervised-Contrastive-Learning.html | 8 +- Swish-A-self-gated-activation-function.html | 8 +- ...ptation-across-Tasks-and-Environments.html | 8 +- ...Batch-Normalization-for-Meta-Learning.html | 8 +- ...rmulation-with-Reinforcement-Learning.html | 8 +- ...hesis-Training-Pruned-Neural-Networks.html | 8 +- The-Tail-at-Scale.html | 8 +- ...ined-Representations-to-Diverse-Tasks.html | 8 +- ...els-Can-Teach-Themselves-to-Use-Tools.html | 488 ++++++++++++++++++ ...-Theory-of-State-Abstraction-for-MDPs.html | 8 +- ...ural-benchmark-for-continual-learning.html | 8 +- ...zation-for-Knowledge-Graph-Completion.html | 8 +- ...fer-Learning-in-Machine-Comprehension.html | 8 +- ...tions-of-Word2Vec-for-Syntax-Problems.html | 8 +- ...pervised-Learning-By-Predicting-Noise.html | 8 +- VQA-Visual-Question-Answering.html | 8 +- ...-Than-10,000-Image-Categories-Tell-Us.html | 8 +- When-Do-Curricula-Work.html | 8 +- ...ent-Models-Don-t-Need-To-Be-Recurrent.html | 8 +- ...tric-models-in-reinforcement-learning.html | 8 +- ...epresentations-via-Gaussian-Embedding.html | 8 +- ...del,-and-You-Should-Treat-it-Like-One.html | 8 +- ...-by-Generating-Task-specific-Adapters.html | 8 +- archieve.html | 4 +- atom.xml | 230 ++++++--- index.html | 14 +- mixup-Beyond-Empirical-Risk-Minimization.html | 8 +- page10/index.html | 2 +- page11/index.html | 2 +- page12/index.html | 2 +- page13/index.html | 2 +- page14/index.html | 2 +- page15/index.html | 2 +- page2/index.html | 2 +- page3/index.html | 2 +- page4/index.html | 2 +- page5/index.html | 2 +- page6/index.html | 2 +- page7/index.html | 2 +- 
page8/index.html | 2 +- page9/index.html | 2 +- tags.html | 104 ++-- 164 files changed, 1323 insertions(+), 699 deletions(-) create mode 100644 Toolformer-Language-Models-Can-Teach-Themselves-to-Use-Tools.html diff --git a/404.html b/404.html index 6792b7a4..f77559d0 100644 --- a/404.html +++ b/404.html @@ -159,7 +159,7 @@ diff --git a/A-Decomposable-Attention-Model-for-Natural-Language-Inference.html b/A-Decomposable-Attention-Model-for-Natural-Language-Inference.html index d75cff45..11a7fd4c 100644 --- a/A-Decomposable-Attention-Model-for-Natural-Language-Inference.html +++ b/A-Decomposable-Attention-Model-for-Natural-Language-Inference.html @@ -159,7 +159,7 @@ @@ -257,9 +257,9 @@

Related Posts

  • - - Hints for Computer System Design - 07 Jan 2022 + + Toolformer - Language Models Can Teach Themselves to Use Tools + 10 Feb 2023

  • diff --git a/A-Fast-and-Accurate-Dependency-Parser-using-Neural-Networks.html b/A-Fast-and-Accurate-Dependency-Parser-using-Neural-Networks.html index 22f999ed..4eed5b47 100644 --- a/A-Fast-and-Accurate-Dependency-Parser-using-Neural-Networks.html +++ b/A-Fast-and-Accurate-Dependency-Parser-using-Neural-Networks.html @@ -159,7 +159,7 @@ @@ -258,9 +258,9 @@

    Related Posts

  • - - Hints for Computer System Design - 07 Jan 2022 + + Toolformer - Language Models Can Teach Themselves to Use Tools + 10 Feb 2023

  • diff --git a/A-Foliated-View-of-Transfer-Learning.html b/A-Foliated-View-of-Transfer-Learning.html index 881c62d4..1d2e2cef 100644 --- a/A-Foliated-View-of-Transfer-Learning.html +++ b/A-Foliated-View-of-Transfer-Learning.html @@ -159,7 +159,7 @@ @@ -263,9 +263,9 @@

    Related Posts

  • - - Hints for Computer System Design - 07 Jan 2022 + + Toolformer - Language Models Can Teach Themselves to Use Tools + 10 Feb 2023

  • diff --git a/A-Semantic-Loss-Function-for-Deep-Learning-with-Symbolic-Knowledge.html b/A-Semantic-Loss-Function-for-Deep-Learning-with-Symbolic-Knowledge.html index 4927c339..e3d58dd9 100644 --- a/A-Semantic-Loss-Function-for-Deep-Learning-with-Symbolic-Knowledge.html +++ b/A-Semantic-Loss-Function-for-Deep-Learning-with-Symbolic-Knowledge.html @@ -159,7 +159,7 @@ @@ -346,9 +346,9 @@

    Related Posts

  • - - Hints for Computer System Design - 07 Jan 2022 + + Toolformer - Language Models Can Teach Themselves to Use Tools + 10 Feb 2023

  • diff --git a/ALBERT-A-Lite-BERT-for-Self-supervised-Learning-of-Language-Representations.html b/ALBERT-A-Lite-BERT-for-Self-supervised-Learning-of-Language-Representations.html index b25a1d27..41aa63de 100644 --- a/ALBERT-A-Lite-BERT-for-Self-supervised-Learning-of-Language-Representations.html +++ b/ALBERT-A-Lite-BERT-for-Self-supervised-Learning-of-Language-Representations.html @@ -159,7 +159,7 @@ @@ -305,9 +305,9 @@

    Related Posts

  • - - Hints for Computer System Design - 07 Jan 2022 + + Toolformer - Language Models Can Teach Themselves to Use Tools + 10 Feb 2023

  • diff --git a/Abductive-Commonsense-Reasoning.html b/Abductive-Commonsense-Reasoning.html index 7533e81e..377e7e48 100644 --- a/Abductive-Commonsense-Reasoning.html +++ b/Abductive-Commonsense-Reasoning.html @@ -159,7 +159,7 @@ @@ -271,9 +271,9 @@

    Related Posts

  • - - Hints for Computer System Design - 07 Jan 2022 + + Toolformer - Language Models Can Teach Themselves to Use Tools + 10 Feb 2023

  • diff --git a/Accurate-Large-Minibatch-SGD-Training-ImageNet-in-1-Hour.html b/Accurate-Large-Minibatch-SGD-Training-ImageNet-in-1-Hour.html index 14cb61c9..ff402f9e 100644 --- a/Accurate-Large-Minibatch-SGD-Training-ImageNet-in-1-Hour.html +++ b/Accurate-Large-Minibatch-SGD-Training-ImageNet-in-1-Hour.html @@ -159,7 +159,7 @@ @@ -298,9 +298,9 @@

    Related Posts

  • - - Hints for Computer System Design - 07 Jan 2022 + + Toolformer - Language Models Can Teach Themselves to Use Tools + 10 Feb 2023

  • diff --git a/Ad-Click-Prediction-a-View-from-the-Trenches.html b/Ad-Click-Prediction-a-View-from-the-Trenches.html index 79404e4d..cf593ccc 100644 --- a/Ad-Click-Prediction-a-View-from-the-Trenches.html +++ b/Ad-Click-Prediction-a-View-from-the-Trenches.html @@ -159,7 +159,7 @@ @@ -335,9 +335,9 @@

    Related Posts

  • - - Hints for Computer System Design - 07 Jan 2022 + + Toolformer - Language Models Can Teach Themselves to Use Tools + 10 Feb 2023

  • diff --git a/Alpha-Net-Adaptation-with-Composition-in-Classifier-Space.html b/Alpha-Net-Adaptation-with-Composition-in-Classifier-Space.html index 4ac23e50..7b69d40c 100644 --- a/Alpha-Net-Adaptation-with-Composition-in-Classifier-Space.html +++ b/Alpha-Net-Adaptation-with-Composition-in-Classifier-Space.html @@ -159,7 +159,7 @@ @@ -279,9 +279,9 @@

    Related Posts

  • - - Hints for Computer System Design - 07 Jan 2022 + + Toolformer - Language Models Can Teach Themselves to Use Tools + 10 Feb 2023

  • diff --git a/An-Empirical-Investigation-of-Catastrophic-Forgetting-in-Gradient-Based-Neural-Networks.html b/An-Empirical-Investigation-of-Catastrophic-Forgetting-in-Gradient-Based-Neural-Networks.html index 6882f090..dd9c8e6a 100644 --- a/An-Empirical-Investigation-of-Catastrophic-Forgetting-in-Gradient-Based-Neural-Networks.html +++ b/An-Empirical-Investigation-of-Catastrophic-Forgetting-in-Gradient-Based-Neural-Networks.html @@ -159,7 +159,7 @@ @@ -271,9 +271,9 @@

    Related Posts

  • - - Hints for Computer System Design - 07 Jan 2022 + + Toolformer - Language Models Can Teach Themselves to Use Tools + 10 Feb 2023

  • diff --git a/Anatomy-of-Catastrophic-Forgetting-Hidden-Representations-and-Task-Semantics.html b/Anatomy-of-Catastrophic-Forgetting-Hidden-Representations-and-Task-Semantics.html index 9ae79da2..ab395376 100644 --- a/Anatomy-of-Catastrophic-Forgetting-Hidden-Representations-and-Task-Semantics.html +++ b/Anatomy-of-Catastrophic-Forgetting-Hidden-Representations-and-Task-Semantics.html @@ -159,7 +159,7 @@ @@ -373,9 +373,9 @@

    Related Posts

  • - - Hints for Computer System Design - 07 Jan 2022 + + Toolformer - Language Models Can Teach Themselves to Use Tools + 10 Feb 2023

  • diff --git a/Ask-Me-Anything-Dynamic-Memory-Networks-for-Natural-Language-Processing.html b/Ask-Me-Anything-Dynamic-Memory-Networks-for-Natural-Language-Processing.html index 85190311..08b2c9b0 100644 --- a/Ask-Me-Anything-Dynamic-Memory-Networks-for-Natural-Language-Processing.html +++ b/Ask-Me-Anything-Dynamic-Memory-Networks-for-Natural-Language-Processing.html @@ -159,7 +159,7 @@ @@ -344,9 +344,9 @@

    Related Posts

  • - - Hints for Computer System Design - 07 Jan 2022 + + Toolformer - Language Models Can Teach Themselves to Use Tools + 10 Feb 2023

  • diff --git a/Assessing-Generalization-in-Deep-Reinforcement-Learning.html b/Assessing-Generalization-in-Deep-Reinforcement-Learning.html index 85d2f745..7c82930a 100644 --- a/Assessing-Generalization-in-Deep-Reinforcement-Learning.html +++ b/Assessing-Generalization-in-Deep-Reinforcement-Learning.html @@ -159,7 +159,7 @@ @@ -332,9 +332,9 @@

    Related Posts

  • - - Hints for Computer System Design - 07 Jan 2022 + + Toolformer - Language Models Can Teach Themselves to Use Tools + 10 Feb 2023

  • diff --git a/Averaging-Weights-leads-to-Wider-Optima-and-Better-Generalization.html b/Averaging-Weights-leads-to-Wider-Optima-and-Better-Generalization.html index 76aa3330..585f7403 100644 --- a/Averaging-Weights-leads-to-Wider-Optima-and-Better-Generalization.html +++ b/Averaging-Weights-leads-to-Wider-Optima-and-Better-Generalization.html @@ -159,7 +159,7 @@ @@ -282,9 +282,9 @@

    Related Posts

  • - - Hints for Computer System Design - 07 Jan 2022 + + Toolformer - Language Models Can Teach Themselves to Use Tools + 10 Feb 2023

  • diff --git a/BabyAI-First-Steps-Towards-Grounded-Language-Learning-With-a-Human-In-the-Loop.html b/BabyAI-First-Steps-Towards-Grounded-Language-Learning-With-a-Human-In-the-Loop.html index 28c23ce4..9566e083 100644 --- a/BabyAI-First-Steps-Towards-Grounded-Language-Learning-With-a-Human-In-the-Loop.html +++ b/BabyAI-First-Steps-Towards-Grounded-Language-Learning-With-a-Human-In-the-Loop.html @@ -159,7 +159,7 @@ @@ -345,9 +345,9 @@

    Related Posts

  • - - Hints for Computer System Design - 07 Jan 2022 + + Toolformer - Language Models Can Teach Themselves to Use Tools + 10 Feb 2023

  • diff --git a/Born-Again-Neural-Networks.html b/Born-Again-Neural-Networks.html index 5f0cfb3b..e0c4a5da 100644 --- a/Born-Again-Neural-Networks.html +++ b/Born-Again-Neural-Networks.html @@ -159,7 +159,7 @@ @@ -314,9 +314,9 @@

    Related Posts

  • - - Hints for Computer System Design - 07 Jan 2022 + + Toolformer - Language Models Can Teach Themselves to Use Tools + 10 Feb 2023

  • diff --git a/CAP-twelve-years-later-How-the-rules-have-changed.html b/CAP-twelve-years-later-How-the-rules-have-changed.html index ba3deb85..0e818ecf 100644 --- a/CAP-twelve-years-later-How-the-rules-have-changed.html +++ b/CAP-twelve-years-later-How-the-rules-have-changed.html @@ -159,7 +159,7 @@ @@ -345,9 +345,9 @@

    Related Posts

  • - - Hints for Computer System Design - 07 Jan 2022 + + Toolformer - Language Models Can Teach Themselves to Use Tools + 10 Feb 2023

  • diff --git a/CURL-Contrastive-Unsupervised-Representations-for-Reinforcement-Learning.html b/CURL-Contrastive-Unsupervised-Representations-for-Reinforcement-Learning.html index 974c262e..1965470c 100644 --- a/CURL-Contrastive-Unsupervised-Representations-for-Reinforcement-Learning.html +++ b/CURL-Contrastive-Unsupervised-Representations-for-Reinforcement-Learning.html @@ -159,7 +159,7 @@ @@ -307,9 +307,9 @@

    Related Posts

  • - - Hints for Computer System Design - 07 Jan 2022 + + Toolformer - Language Models Can Teach Themselves to Use Tools + 10 Feb 2023

  • diff --git a/Cassandra-a-decentralized-structured-storage-system.html b/Cassandra-a-decentralized-structured-storage-system.html index 071e3591..6b15b46e 100644 --- a/Cassandra-a-decentralized-structured-storage-system.html +++ b/Cassandra-a-decentralized-structured-storage-system.html @@ -159,7 +159,7 @@ @@ -292,9 +292,9 @@

    Related Posts

  • - - Hints for Computer System Design - 07 Jan 2022 + + Toolformer - Language Models Can Teach Themselves to Use Tools + 10 Feb 2023

  • diff --git a/Competitive-Training-of-Mixtures-of-Independent-Deep-Generative-Models.html b/Competitive-Training-of-Mixtures-of-Independent-Deep-Generative-Models.html index 889b9122..98ce4822 100644 --- a/Competitive-Training-of-Mixtures-of-Independent-Deep-Generative-Models.html +++ b/Competitive-Training-of-Mixtures-of-Independent-Deep-Generative-Models.html @@ -159,7 +159,7 @@ @@ -286,9 +286,9 @@

    Related Posts

  • - - Hints for Computer System Design - 07 Jan 2022 + + Toolformer - Language Models Can Teach Themselves to Use Tools + 10 Feb 2023

  • diff --git a/Compositional-Explanations-of-Neurons.html b/Compositional-Explanations-of-Neurons.html index cdf7741e..cd0a364c 100644 --- a/Compositional-Explanations-of-Neurons.html +++ b/Compositional-Explanations-of-Neurons.html @@ -159,7 +159,7 @@ @@ -346,9 +346,9 @@

    Related Posts

  • - - Hints for Computer System Design - 07 Jan 2022 + + Toolformer - Language Models Can Teach Themselves to Use Tools + 10 Feb 2023

  • diff --git a/Conditional-Similarity-Networks.html b/Conditional-Similarity-Networks.html index e73030ea..840f45b1 100644 --- a/Conditional-Similarity-Networks.html +++ b/Conditional-Similarity-Networks.html @@ -159,7 +159,7 @@ @@ -294,9 +294,9 @@

    Related Posts

  • - - Hints for Computer System Design - 07 Jan 2022 + + Toolformer - Language Models Can Teach Themselves to Use Tools + 10 Feb 2023

  • diff --git a/Consistency-Tradeoffs-in-Modern-Distributed-Database-System-Design.html b/Consistency-Tradeoffs-in-Modern-Distributed-Database-System-Design.html index cc07f959..957dc129 100644 --- a/Consistency-Tradeoffs-in-Modern-Distributed-Database-System-Design.html +++ b/Consistency-Tradeoffs-in-Modern-Distributed-Database-System-Design.html @@ -159,7 +159,7 @@ @@ -314,9 +314,9 @@

    Related Posts

  • - - Hints for Computer System Design - 07 Jan 2022 + + Toolformer - Language Models Can Teach Themselves to Use Tools + 10 Feb 2023

  • diff --git a/Continual-learning-with-hypernetworks.html b/Continual-learning-with-hypernetworks.html index 4f1f081d..4f61c15c 100644 --- a/Continual-learning-with-hypernetworks.html +++ b/Continual-learning-with-hypernetworks.html @@ -159,7 +159,7 @@ @@ -311,9 +311,9 @@

    Related Posts

  • - - Hints for Computer System Design - 07 Jan 2022 + + Toolformer - Language Models Can Teach Themselves to Use Tools + 10 Feb 2023

  • diff --git a/Contrastive-Learning-of-Structured-World-Models.html b/Contrastive-Learning-of-Structured-World-Models.html index 3ee06647..6e6062a4 100644 --- a/Contrastive-Learning-of-Structured-World-Models.html +++ b/Contrastive-Learning-of-Structured-World-Models.html @@ -159,7 +159,7 @@ @@ -322,9 +322,9 @@

    Related Posts

  • - - Hints for Computer System Design - 07 Jan 2022 + + Toolformer - Language Models Can Teach Themselves to Use Tools + 10 Feb 2023

  • diff --git a/Cyclical-Learning-Rates-for-Training-Neural-Networks.html b/Cyclical-Learning-Rates-for-Training-Neural-Networks.html index 18ae4cde..6bf6d1dc 100644 --- a/Cyclical-Learning-Rates-for-Training-Neural-Networks.html +++ b/Cyclical-Learning-Rates-for-Training-Neural-Networks.html @@ -159,7 +159,7 @@ @@ -257,9 +257,9 @@

    Related Posts

  • - - Hints for Computer System Design - 07 Jan 2022 + + Toolformer - Language Models Can Teach Themselves to Use Tools + 10 Feb 2023

  • diff --git a/Data-Management-for-Internet-Scale-Single-Sign-On.html b/Data-Management-for-Internet-Scale-Single-Sign-On.html index 168790d1..5b06660a 100644 --- a/Data-Management-for-Internet-Scale-Single-Sign-On.html +++ b/Data-Management-for-Internet-Scale-Single-Sign-On.html @@ -159,7 +159,7 @@ @@ -318,9 +318,9 @@

    Related Posts

  • - - Hints for Computer System Design - 07 Jan 2022 + + Toolformer - Language Models Can Teach Themselves to Use Tools + 10 Feb 2023

  • diff --git a/Decentralized-Reinforcement-Learning-Global-Decision-Making-via-Local-Economic-Transactions.html b/Decentralized-Reinforcement-Learning-Global-Decision-Making-via-Local-Economic-Transactions.html index 4aea4669..bb92f318 100644 --- a/Decentralized-Reinforcement-Learning-Global-Decision-Making-via-Local-Economic-Transactions.html +++ b/Decentralized-Reinforcement-Learning-Global-Decision-Making-via-Local-Economic-Transactions.html @@ -159,7 +159,7 @@ @@ -325,9 +325,9 @@

    Related Posts

  • - - Hints for Computer System Design - 07 Jan 2022 + + Toolformer - Language Models Can Teach Themselves to Use Tools + 10 Feb 2023

  • diff --git a/Deep-Neural-Networks-for-YouTube-Recommendations.html b/Deep-Neural-Networks-for-YouTube-Recommendations.html index ba2d4a61..c1eeebf7 100644 --- a/Deep-Neural-Networks-for-YouTube-Recommendations.html +++ b/Deep-Neural-Networks-for-YouTube-Recommendations.html @@ -159,7 +159,7 @@ @@ -342,9 +342,9 @@

    Related Posts

  • - - Hints for Computer System Design - 07 Jan 2022 + + Toolformer - Language Models Can Teach Themselves to Use Tools + 10 Feb 2023

  • diff --git a/Deep-Reinforcement-Learning-and-the-Deadly-Triad.html b/Deep-Reinforcement-Learning-and-the-Deadly-Triad.html index 1cb3118e..c558f390 100644 --- a/Deep-Reinforcement-Learning-and-the-Deadly-Triad.html +++ b/Deep-Reinforcement-Learning-and-the-Deadly-Triad.html @@ -159,7 +159,7 @@ @@ -330,9 +330,9 @@

    Related Posts

  • - - Hints for Computer System Design - 07 Jan 2022 + + Toolformer - Language Models Can Teach Themselves to Use Tools + 10 Feb 2023

  • diff --git a/Deep-Reinforcement-Learning-in-a-Handful-of-Trials-using-Probabilistic-Dynamics-Models.html b/Deep-Reinforcement-Learning-in-a-Handful-of-Trials-using-Probabilistic-Dynamics-Models.html index 68f1ec7f..3a4cd5db 100644 --- a/Deep-Reinforcement-Learning-in-a-Handful-of-Trials-using-Probabilistic-Dynamics-Models.html +++ b/Deep-Reinforcement-Learning-in-a-Handful-of-Trials-using-Probabilistic-Dynamics-Models.html @@ -159,7 +159,7 @@ @@ -272,9 +272,9 @@

    Related Posts

  • - - Hints for Computer System Design - 07 Jan 2022 + + Toolformer - Language Models Can Teach Themselves to Use Tools + 10 Feb 2023

  • diff --git a/Design-patterns-for-container-based-distributed-systems.html b/Design-patterns-for-container-based-distributed-systems.html index 9fb46b62..7f904ec5 100644 --- a/Design-patterns-for-container-based-distributed-systems.html +++ b/Design-patterns-for-container-based-distributed-systems.html @@ -159,7 +159,7 @@ @@ -259,9 +259,9 @@

    Related Posts

  • - - Hints for Computer System Design - 07 Jan 2022 + + Toolformer - Language Models Can Teach Themselves to Use Tools + 10 Feb 2023

  • diff --git a/Distilling-the-Knowledge-in-a-Neural-Network.html b/Distilling-the-Knowledge-in-a-Neural-Network.html index 2343a55d..2cdcaee3 100644 --- a/Distilling-the-Knowledge-in-a-Neural-Network.html +++ b/Distilling-the-Knowledge-in-a-Neural-Network.html @@ -159,7 +159,7 @@ @@ -283,9 +283,9 @@

    Related Posts

  • - - Hints for Computer System Design - 07 Jan 2022 + + Toolformer - Language Models Can Teach Themselves to Use Tools + 10 Feb 2023

  • diff --git a/Diversity-is-All-You-Need-Learning-Skills-without-a-Reward-Function.html b/Diversity-is-All-You-Need-Learning-Skills-without-a-Reward-Function.html index 97c729fa..29b76d0a 100644 --- a/Diversity-is-All-You-Need-Learning-Skills-without-a-Reward-Function.html +++ b/Diversity-is-All-You-Need-Learning-Skills-without-a-Reward-Function.html @@ -159,7 +159,7 @@ @@ -295,9 +295,9 @@

    Related Posts

  • - - Hints for Computer System Design - 07 Jan 2022 + + Toolformer - Language Models Can Teach Themselves to Use Tools + 10 Feb 2023

  • diff --git a/ELECTRA-Pre-training-Text-Encoders-as-Discriminators-Rather-Than-Generators.html b/ELECTRA-Pre-training-Text-Encoders-as-Discriminators-Rather-Than-Generators.html index aa61c975..0e008087 100644 --- a/ELECTRA-Pre-training-Text-Encoders-as-Discriminators-Rather-Than-Generators.html +++ b/ELECTRA-Pre-training-Text-Encoders-as-Discriminators-Rather-Than-Generators.html @@ -159,7 +159,7 @@ @@ -341,9 +341,9 @@

    Related Posts

  • - - Hints for Computer System Design - 07 Jan 2022 + + Toolformer - Language Models Can Teach Themselves to Use Tools + 10 Feb 2023

  • diff --git a/Efficient-Lifelong-Learning-with-A-GEM.html b/Efficient-Lifelong-Learning-with-A-GEM.html index 7349298a..2a6b3cde 100644 --- a/Efficient-Lifelong-Learning-with-A-GEM.html +++ b/Efficient-Lifelong-Learning-with-A-GEM.html @@ -159,7 +159,7 @@ @@ -355,9 +355,9 @@

    Related Posts

  • - - Hints for Computer System Design - 07 Jan 2022 + + Toolformer - Language Models Can Teach Themselves to Use Tools + 10 Feb 2023

  • diff --git a/Emergence-of-Grounded-Compositional-Language-in-Multi-Agent-Populations.html b/Emergence-of-Grounded-Compositional-Language-in-Multi-Agent-Populations.html index 31d69b23..f5cf560c 100644 --- a/Emergence-of-Grounded-Compositional-Language-in-Multi-Agent-Populations.html +++ b/Emergence-of-Grounded-Compositional-Language-in-Multi-Agent-Populations.html @@ -159,7 +159,7 @@ @@ -312,9 +312,9 @@

    Related Posts

  • - - Hints for Computer System Design - 07 Jan 2022 + + Toolformer - Language Models Can Teach Themselves to Use Tools + 10 Feb 2023

  • diff --git a/Emotional-Chatting-Machine-Emotional-Conversation-Generation-with-Internal-and-External-Memory.html b/Emotional-Chatting-Machine-Emotional-Conversation-Generation-with-Internal-and-External-Memory.html index 060b4e25..eade4822 100644 --- a/Emotional-Chatting-Machine-Emotional-Conversation-Generation-with-Internal-and-External-Memory.html +++ b/Emotional-Chatting-Machine-Emotional-Conversation-Generation-with-Internal-and-External-Memory.html @@ -159,7 +159,7 @@ @@ -270,9 +270,9 @@

    Related Posts

  • - - Hints for Computer System Design - 07 Jan 2022 + + Toolformer - Language Models Can Teach Themselves to Use Tools + 10 Feb 2023

  • diff --git a/Energy-based-Models-for-Continual-Learning.html b/Energy-based-Models-for-Continual-Learning.html index 006120c6..5c6ad697 100644 --- a/Energy-based-Models-for-Continual-Learning.html +++ b/Energy-based-Models-for-Continual-Learning.html @@ -159,7 +159,7 @@ @@ -325,9 +325,9 @@

    Related Posts

  • - - Hints for Computer System Design - 07 Jan 2022 + + Toolformer - Language Models Can Teach Themselves to Use Tools + 10 Feb 2023

  • diff --git a/Everything-Happens-for-a-Reason-Discovering-the-Purpose-of-Actions-in-Procedural-Text.html b/Everything-Happens-for-a-Reason-Discovering-the-Purpose-of-Actions-in-Procedural-Text.html index 48a40941..fa8dd5aa 100644 --- a/Everything-Happens-for-a-Reason-Discovering-the-Purpose-of-Actions-in-Procedural-Text.html +++ b/Everything-Happens-for-a-Reason-Discovering-the-Purpose-of-Actions-in-Procedural-Text.html @@ -159,7 +159,7 @@ @@ -395,9 +395,9 @@

    Related Posts

  • - - Hints for Computer System Design - 07 Jan 2022 + + Toolformer - Language Models Can Teach Themselves to Use Tools + 10 Feb 2023

  • diff --git a/Exploring-Models-and-Data-for-Image-Question-Answering.html b/Exploring-Models-and-Data-for-Image-Question-Answering.html index 8b5c4475..e09e36aa 100644 --- a/Exploring-Models-and-Data-for-Image-Question-Answering.html +++ b/Exploring-Models-and-Data-for-Image-Question-Answering.html @@ -159,7 +159,7 @@ @@ -268,9 +268,9 @@

    Related Posts

  • - - Hints for Computer System Design - 07 Jan 2022 + + Toolformer - Language Models Can Teach Themselves to Use Tools + 10 Feb 2023

  • diff --git a/Exploring-Simple-Siamese-Representation-Learning.html b/Exploring-Simple-Siamese-Representation-Learning.html index e2208fb3..9b88e3da 100644 --- a/Exploring-Simple-Siamese-Representation-Learning.html +++ b/Exploring-Simple-Siamese-Representation-Learning.html @@ -159,7 +159,7 @@ @@ -298,9 +298,9 @@

    Related Posts

  • - - Hints for Computer System Design - 07 Jan 2022 + + Toolformer - Language Models Can Teach Themselves to Use Tools + 10 Feb 2023

  • diff --git a/Extrapolating-Beyond-Suboptimal-Demonstrations-via-Inverse-Reinforcement-Learning-from-Observations.html b/Extrapolating-Beyond-Suboptimal-Demonstrations-via-Inverse-Reinforcement-Learning-from-Observations.html index 0ca2f46b..672cb18b 100644 --- a/Extrapolating-Beyond-Suboptimal-Demonstrations-via-Inverse-Reinforcement-Learning-from-Observations.html +++ b/Extrapolating-Beyond-Suboptimal-Demonstrations-via-Inverse-Reinforcement-Learning-from-Observations.html @@ -159,7 +159,7 @@ @@ -263,9 +263,9 @@

    Related Posts

  • - - Hints for Computer System Design - 07 Jan 2022 + + Toolformer - Language Models Can Teach Themselves to Use Tools + 10 Feb 2023

  • diff --git a/GNN-Explainer-A-Tool-for-Post-hoc-Explanation-of-Graph-Neural-Networks.html b/GNN-Explainer-A-Tool-for-Post-hoc-Explanation-of-Graph-Neural-Networks.html index 07a05217..2adc462e 100644 --- a/GNN-Explainer-A-Tool-for-Post-hoc-Explanation-of-Graph-Neural-Networks.html +++ b/GNN-Explainer-A-Tool-for-Post-hoc-Explanation-of-Graph-Neural-Networks.html @@ -159,7 +159,7 @@ @@ -391,9 +391,9 @@

    Related Posts

  • - - Hints for Computer System Design - 07 Jan 2022 + + Toolformer - Language Models Can Teach Themselves to Use Tools + 10 Feb 2023

  • diff --git a/GPipe-Easy-Scaling-with-Micro-Batch-Pipeline-Parallelism.html b/GPipe-Easy-Scaling-with-Micro-Batch-Pipeline-Parallelism.html index 46e57acf..11678bb8 100644 --- a/GPipe-Easy-Scaling-with-Micro-Batch-Pipeline-Parallelism.html +++ b/GPipe-Easy-Scaling-with-Micro-Batch-Pipeline-Parallelism.html @@ -159,7 +159,7 @@ @@ -261,9 +261,9 @@

    Related Posts

  • - - Hints for Computer System Design - 07 Jan 2022 + + Toolformer - Language Models Can Teach Themselves to Use Tools + 10 Feb 2023

  • diff --git a/Get-To-The-Point-Summarization-with-Pointer-Generator-Networks.html b/Get-To-The-Point-Summarization-with-Pointer-Generator-Networks.html index 311254f4..89c5d0b0 100644 --- a/Get-To-The-Point-Summarization-with-Pointer-Generator-Networks.html +++ b/Get-To-The-Point-Summarization-with-Pointer-Generator-Networks.html @@ -159,7 +159,7 @@ @@ -263,9 +263,9 @@

    Related Posts

  • - - Hints for Computer System Design - 07 Jan 2022 + + Toolformer - Language Models Can Teach Themselves to Use Tools + 10 Feb 2023

  • diff --git a/Good-Enough-Compositional-Data-Augmentation.html b/Good-Enough-Compositional-Data-Augmentation.html index 8ae5a970..190193e7 100644 --- a/Good-Enough-Compositional-Data-Augmentation.html +++ b/Good-Enough-Compositional-Data-Augmentation.html @@ -159,7 +159,7 @@ @@ -238,9 +238,9 @@

    Related Posts

  • - - Hints for Computer System Design - 07 Jan 2022 + + Toolformer - Language Models Can Teach Themselves to Use Tools + 10 Feb 2023

  • diff --git a/Gossip-based-Actor-Learner-Architectures-for-Deep-RL.html b/Gossip-based-Actor-Learner-Architectures-for-Deep-RL.html index 7bfc2c12..21acd720 100644 --- a/Gossip-based-Actor-Learner-Architectures-for-Deep-RL.html +++ b/Gossip-based-Actor-Learner-Architectures-for-Deep-RL.html @@ -159,7 +159,7 @@ @@ -253,9 +253,9 @@

    Related Posts

  • - - Hints for Computer System Design - 07 Jan 2022 + + Toolformer - Language Models Can Teach Themselves to Use Tools + 10 Feb 2023

  • diff --git a/GradNorm-Gradient-Normalization-for-Adaptive-Loss-Balancing-in-Deep-Multitask-Networks.html b/GradNorm-Gradient-Normalization-for-Adaptive-Loss-Balancing-in-Deep-Multitask-Networks.html index fdc13f41..2b5a3dff 100644 --- a/GradNorm-Gradient-Normalization-for-Adaptive-Loss-Balancing-in-Deep-Multitask-Networks.html +++ b/GradNorm-Gradient-Normalization-for-Adaptive-Loss-Balancing-in-Deep-Multitask-Networks.html @@ -159,7 +159,7 @@ @@ -290,9 +290,9 @@

    Related Posts

  • - - Hints for Computer System Design - 07 Jan 2022 + + Toolformer - Language Models Can Teach Themselves to Use Tools + 10 Feb 2023

  • diff --git a/Gradient-Surgery-for-Multi-Task-Learning.html b/Gradient-Surgery-for-Multi-Task-Learning.html index dd7046b6..0e562cca 100644 --- a/Gradient-Surgery-for-Multi-Task-Learning.html +++ b/Gradient-Surgery-for-Multi-Task-Learning.html @@ -159,7 +159,7 @@ @@ -304,9 +304,9 @@

    Related Posts

  • - - Hints for Computer System Design - 07 Jan 2022 + + Toolformer - Language Models Can Teach Themselves to Use Tools + 10 Feb 2023

  • diff --git a/Gradient-based-sample-selection-for-online-continual-learning.html b/Gradient-based-sample-selection-for-online-continual-learning.html index 25c92bbf..61ed5113 100644 --- a/Gradient-based-sample-selection-for-online-continual-learning.html +++ b/Gradient-based-sample-selection-for-online-continual-learning.html @@ -159,7 +159,7 @@ @@ -313,9 +313,9 @@

    Related Posts

  • - - Hints for Computer System Design - 07 Jan 2022 + + Toolformer - Language Models Can Teach Themselves to Use Tools + 10 Feb 2023

  • diff --git a/HARP-Hierarchical-Representation-Learning-for-Networks.html b/HARP-Hierarchical-Representation-Learning-for-Networks.html index e49e3f73..9d069f58 100644 --- a/HARP-Hierarchical-Representation-Learning-for-Networks.html +++ b/HARP-Hierarchical-Representation-Learning-for-Networks.html @@ -159,7 +159,7 @@ @@ -246,9 +246,9 @@

    Related Posts

  • - - Hints for Computer System Design - 07 Jan 2022 + + Toolformer - Language Models Can Teach Themselves to Use Tools + 10 Feb 2023

  • diff --git a/Hamiltonian-Neural-Networks.html b/Hamiltonian-Neural-Networks.html index a9aac38f..d70c8213 100644 --- a/Hamiltonian-Neural-Networks.html +++ b/Hamiltonian-Neural-Networks.html @@ -159,7 +159,7 @@ @@ -270,9 +270,9 @@

    Related Posts

  • - - Hints for Computer System Design - 07 Jan 2022 + + Toolformer - Language Models Can Teach Themselves to Use Tools + 10 Feb 2023

  • diff --git a/Harvest,-Yield,-and-Scalable-Tolerant-Systems.html b/Harvest,-Yield,-and-Scalable-Tolerant-Systems.html index 17715a66..6687739c 100644 --- a/Harvest,-Yield,-and-Scalable-Tolerant-Systems.html +++ b/Harvest,-Yield,-and-Scalable-Tolerant-Systems.html @@ -159,7 +159,7 @@ @@ -273,9 +273,9 @@

    Related Posts

  • - - Hints for Computer System Design - 07 Jan 2022 + + Toolformer - Language Models Can Teach Themselves to Use Tools + 10 Feb 2023

  • diff --git a/Hierarchical-Graph-Representation-Learning-with-Differentiable-Pooling.html b/Hierarchical-Graph-Representation-Learning-with-Differentiable-Pooling.html index 5db47cff..1df7e780 100644 --- a/Hierarchical-Graph-Representation-Learning-with-Differentiable-Pooling.html +++ b/Hierarchical-Graph-Representation-Learning-with-Differentiable-Pooling.html @@ -159,7 +159,7 @@ @@ -324,9 +324,9 @@

    Related Posts

  • - - Hints for Computer System Design - 07 Jan 2022 + + Toolformer - Language Models Can Teach Themselves to Use Tools + 10 Feb 2023

  • diff --git a/Hierarchical-RL-Using-an-Ensemble-of-Proprioceptive-Periodic-Policies.html b/Hierarchical-RL-Using-an-Ensemble-of-Proprioceptive-Periodic-Policies.html index f93544cf..041e59ad 100644 --- a/Hierarchical-RL-Using-an-Ensemble-of-Proprioceptive-Periodic-Policies.html +++ b/Hierarchical-RL-Using-an-Ensemble-of-Proprioceptive-Periodic-Policies.html @@ -159,7 +159,7 @@ @@ -298,9 +298,9 @@

    Related Posts

  • - - Hints for Computer System Design - 07 Jan 2022 + + Toolformer - Language Models Can Teach Themselves to Use Tools + 10 Feb 2023

  • diff --git a/Higher-order-organization-of-complex-networks.html b/Higher-order-organization-of-complex-networks.html index b4e0bfdc..4bbccb5c 100644 --- a/Higher-order-organization-of-complex-networks.html +++ b/Higher-order-organization-of-complex-networks.html @@ -159,7 +159,7 @@ @@ -253,9 +253,9 @@

    Related Posts

  • - - Hints for Computer System Design - 07 Jan 2022 + + Toolformer - Language Models Can Teach Themselves to Use Tools + 10 Feb 2023

  • diff --git a/Hindsight-Experience-Replay.html b/Hindsight-Experience-Replay.html index 5560fbcf..791dfa6a 100644 --- a/Hindsight-Experience-Replay.html +++ b/Hindsight-Experience-Replay.html @@ -159,7 +159,7 @@ @@ -267,9 +267,9 @@

    Related Posts

  • - - Hints for Computer System Design - 07 Jan 2022 + + Toolformer - Language Models Can Teach Themselves to Use Tools + 10 Feb 2023

  • diff --git a/HoME-a-Household-Multimodal-Environment.html b/HoME-a-Household-Multimodal-Environment.html index b588499f..b94f3fda 100644 --- a/HoME-a-Household-Multimodal-Environment.html +++ b/HoME-a-Household-Multimodal-Environment.html @@ -159,7 +159,7 @@ @@ -294,9 +294,9 @@

    Related Posts

  • - - Hints for Computer System Design - 07 Jan 2022 + + Toolformer - Language Models Can Teach Themselves to Use Tools + 10 Feb 2023

  • diff --git a/How-to-train-your-MAML.html b/How-to-train-your-MAML.html index a4ddbd65..c92654d9 100644 --- a/How-to-train-your-MAML.html +++ b/How-to-train-your-MAML.html @@ -159,7 +159,7 @@ @@ -282,9 +282,9 @@

    Related Posts

  • - - Hints for Computer System Design - 07 Jan 2022 + + Toolformer - Language Models Can Teach Themselves to Use Tools + 10 Feb 2023

  • diff --git a/How-transferable-are-features-in-deep-neural-networks.html b/How-transferable-are-features-in-deep-neural-networks.html index afd291e6..d56bf76d 100644 --- a/How-transferable-are-features-in-deep-neural-networks.html +++ b/How-transferable-are-features-in-deep-neural-networks.html @@ -159,7 +159,7 @@ @@ -290,9 +290,9 @@

    Related Posts

  • - - Hints for Computer System Design - 07 Jan 2022 + + Toolformer - Language Models Can Teach Themselves to Use Tools + 10 Feb 2023

  • diff --git a/HyperNetworks.html b/HyperNetworks.html index bf7fc70a..362d2a64 100644 --- a/HyperNetworks.html +++ b/HyperNetworks.html @@ -159,7 +159,7 @@ @@ -274,9 +274,9 @@

    Related Posts

  • - - Hints for Computer System Design - 07 Jan 2022 + + Toolformer - Language Models Can Teach Themselves to Use Tools + 10 Feb 2023

  • diff --git a/Imagination-Augmented-Agents-for-Deep-Reinforcement-Learning.html b/Imagination-Augmented-Agents-for-Deep-Reinforcement-Learning.html index b9827c2e..b6ec8c9b 100644 --- a/Imagination-Augmented-Agents-for-Deep-Reinforcement-Learning.html +++ b/Imagination-Augmented-Agents-for-Deep-Reinforcement-Learning.html @@ -159,7 +159,7 @@ @@ -273,9 +273,9 @@

    Related Posts

  • - - Hints for Computer System Design - 07 Jan 2022 + + Toolformer - Language Models Can Teach Themselves to Use Tools + 10 Feb 2023

  • diff --git a/Improving-Information-Extraction-by-Acquiring-External-Evidence-with-Reinforcement-Learning.html b/Improving-Information-Extraction-by-Acquiring-External-Evidence-with-Reinforcement-Learning.html index 5e3119e0..d2121df1 100644 --- a/Improving-Information-Extraction-by-Acquiring-External-Evidence-with-Reinforcement-Learning.html +++ b/Improving-Information-Extraction-by-Acquiring-External-Evidence-with-Reinforcement-Learning.html @@ -159,7 +159,7 @@ @@ -311,9 +311,9 @@

    Related Posts

  • - - Hints for Computer System Design - 07 Jan 2022 + + Toolformer - Language Models Can Teach Themselves to Use Tools + 10 Feb 2023

  • diff --git a/Kronecker-Recurrent-Units.html b/Kronecker-Recurrent-Units.html index 2b1bd236..6761d0f1 100644 --- a/Kronecker-Recurrent-Units.html +++ b/Kronecker-Recurrent-Units.html @@ -159,7 +159,7 @@ @@ -347,9 +347,9 @@

    Related Posts

  • - - Hints for Computer System Design - 07 Jan 2022 + + Toolformer - Language Models Can Teach Themselves to Use Tools + 10 Feb 2023

  • diff --git a/Large-Memory-Layers-with-Product-Keys.html b/Large-Memory-Layers-with-Product-Keys.html index 6050b548..8bc05b1d 100644 --- a/Large-Memory-Layers-with-Product-Keys.html +++ b/Large-Memory-Layers-with-Product-Keys.html @@ -159,7 +159,7 @@ @@ -296,9 +296,9 @@

    Related Posts

  • - - Hints for Computer System Design - 07 Jan 2022 + + Toolformer - Language Models Can Teach Themselves to Use Tools + 10 Feb 2023

  • diff --git a/Learned-Optimizers-that-Scale-and-Generalize.html b/Learned-Optimizers-that-Scale-and-Generalize.html index 46de6169..6ed5b0d5 100644 --- a/Learned-Optimizers-that-Scale-and-Generalize.html +++ b/Learned-Optimizers-that-Scale-and-Generalize.html @@ -159,7 +159,7 @@ @@ -261,9 +261,9 @@

    Related Posts

  • - - Hints for Computer System Design - 07 Jan 2022 + + Toolformer - Language Models Can Teach Themselves to Use Tools + 10 Feb 2023

  • diff --git a/Learning-Explanations-That-Are-Hard-To-Vary.html b/Learning-Explanations-That-Are-Hard-To-Vary.html index f63a6e16..2b4ec987 100644 --- a/Learning-Explanations-That-Are-Hard-To-Vary.html +++ b/Learning-Explanations-That-Are-Hard-To-Vary.html @@ -159,7 +159,7 @@ @@ -277,9 +277,9 @@

    Related Posts

  • - - Hints for Computer System Design - 07 Jan 2022 + + Toolformer - Language Models Can Teach Themselves to Use Tools + 10 Feb 2023

  • diff --git a/Learning-Independent-Causal-Mechanisms.html b/Learning-Independent-Causal-Mechanisms.html index 22f8da09..1d6f2de1 100644 --- a/Learning-Independent-Causal-Mechanisms.html +++ b/Learning-Independent-Causal-Mechanisms.html @@ -159,7 +159,7 @@ @@ -315,9 +315,9 @@

    Related Posts

  • - - Hints for Computer System Design - 07 Jan 2022 + + Toolformer - Language Models Can Teach Themselves to Use Tools + 10 Feb 2023

  • diff --git a/Learning-a-SAT-Solver-from-Single-Bit-Supervision.html b/Learning-a-SAT-Solver-from-Single-Bit-Supervision.html index 988defc6..856a2b12 100644 --- a/Learning-a-SAT-Solver-from-Single-Bit-Supervision.html +++ b/Learning-a-SAT-Solver-from-Single-Bit-Supervision.html @@ -159,7 +159,7 @@ @@ -286,9 +286,9 @@

    Related Posts

  • - - Hints for Computer System Design - 07 Jan 2022 + + Toolformer - Language Models Can Teach Themselves to Use Tools + 10 Feb 2023

  • diff --git a/Learning-to-Compute-Word-Embeddings-On-the-Fly.html b/Learning-to-Compute-Word-Embeddings-On-the-Fly.html index 5aff02dc..b10a64a1 100644 --- a/Learning-to-Compute-Word-Embeddings-On-the-Fly.html +++ b/Learning-to-Compute-Word-Embeddings-On-the-Fly.html @@ -159,7 +159,7 @@ @@ -270,9 +270,9 @@

    Related Posts

  • - - Hints for Computer System Design - 07 Jan 2022 + + Toolformer - Language Models Can Teach Themselves to Use Tools + 10 Feb 2023

  • diff --git a/Learning-to-Count-Objects-in-Natural-Images-for-Visual-Question-Answering.html b/Learning-to-Count-Objects-in-Natural-Images-for-Visual-Question-Answering.html index 6bedefa9..46ea69b0 100644 --- a/Learning-to-Count-Objects-in-Natural-Images-for-Visual-Question-Answering.html +++ b/Learning-to-Count-Objects-in-Natural-Images-for-Visual-Question-Answering.html @@ -159,7 +159,7 @@ @@ -265,9 +265,9 @@

    Related Posts

  • - - Hints for Computer System Design - 07 Jan 2022 + + Toolformer - Language Models Can Teach Themselves to Use Tools + 10 Feb 2023

  • diff --git a/Linguistic-Knowledge-as-Memory-for-Recurrent-Neural-Networks.html b/Linguistic-Knowledge-as-Memory-for-Recurrent-Neural-Networks.html index 4af0b113..09be790c 100644 --- a/Linguistic-Knowledge-as-Memory-for-Recurrent-Neural-Networks.html +++ b/Linguistic-Knowledge-as-Memory-for-Recurrent-Neural-Networks.html @@ -159,7 +159,7 @@ @@ -250,9 +250,9 @@

    Related Posts

  • - - Hints for Computer System Design - 07 Jan 2022 + + Toolformer - Language Models Can Teach Themselves to Use Tools + 10 Feb 2023

  • diff --git a/MONet-Unsupervised-Scene-Decomposition-and-Representation.html b/MONet-Unsupervised-Scene-Decomposition-and-Representation.html index 1823b6fc..1f81afa1 100644 --- a/MONet-Unsupervised-Scene-Decomposition-and-Representation.html +++ b/MONet-Unsupervised-Scene-Decomposition-and-Representation.html @@ -159,7 +159,7 @@ @@ -282,9 +282,9 @@

    Related Posts

  • - - Hints for Computer System Design - 07 Jan 2022 + + Toolformer - Language Models Can Teach Themselves to Use Tools + 10 Feb 2023

  • diff --git a/Making-the-V-in-VQA-Matter-Elevating-the-Role-of-Image-Understanding-in-Visual-Question-Answering.html b/Making-the-V-in-VQA-Matter-Elevating-the-Role-of-Image-Understanding-in-Visual-Question-Answering.html index 6724876c..e815ad86 100644 --- a/Making-the-V-in-VQA-Matter-Elevating-the-Role-of-Image-Understanding-in-Visual-Question-Answering.html +++ b/Making-the-V-in-VQA-Matter-Elevating-the-Role-of-Image-Understanding-in-Visual-Question-Answering.html @@ -159,7 +159,7 @@ @@ -229,9 +229,9 @@

    Related Posts

  • - - Hints for Computer System Design - 07 Jan 2022 + + Toolformer - Language Models Can Teach Themselves to Use Tools + 10 Feb 2023

  • diff --git a/Massively-Multilingual-Neural-Machine-Translation-in-the-Wild-Findings-and-Challenges.html b/Massively-Multilingual-Neural-Machine-Translation-in-the-Wild-Findings-and-Challenges.html index 54c2bb28..7c8ad86d 100644 --- a/Massively-Multilingual-Neural-Machine-Translation-in-the-Wild-Findings-and-Challenges.html +++ b/Massively-Multilingual-Neural-Machine-Translation-in-the-Wild-Findings-and-Challenges.html @@ -159,7 +159,7 @@ @@ -370,9 +370,9 @@

    Related Posts

  • - - Hints for Computer System Design - 07 Jan 2022 + + Toolformer - Language Models Can Teach Themselves to Use Tools + 10 Feb 2023

  • diff --git a/Mastering-Atari,-Go,-Chess-and-Shogi-by-Planning-with-a-Learned-Model.html b/Mastering-Atari,-Go,-Chess-and-Shogi-by-Planning-with-a-Learned-Model.html index 0a41d683..78940be8 100644 --- a/Mastering-Atari,-Go,-Chess-and-Shogi-by-Planning-with-a-Learned-Model.html +++ b/Mastering-Atari,-Go,-Chess-and-Shogi-by-Planning-with-a-Learned-Model.html @@ -159,7 +159,7 @@ @@ -312,9 +312,9 @@

    Related Posts

  • - - Hints for Computer System Design - 07 Jan 2022 + + Toolformer - Language Models Can Teach Themselves to Use Tools + 10 Feb 2023

  • diff --git a/Measuring-Abstract-Reasoning-in-Neural-Networks.html b/Measuring-Abstract-Reasoning-in-Neural-Networks.html index a2911d64..cd1bff3b 100644 --- a/Measuring-Abstract-Reasoning-in-Neural-Networks.html +++ b/Measuring-Abstract-Reasoning-in-Neural-Networks.html @@ -159,7 +159,7 @@ @@ -356,9 +356,9 @@

    Related Posts

  • - - Hints for Computer System Design - 07 Jan 2022 + + Toolformer - Language Models Can Teach Themselves to Use Tools + 10 Feb 2023

  • diff --git a/Memory-Based-Parameter-Adaption.html b/Memory-Based-Parameter-Adaption.html index fbce13fa..59ccefb4 100644 --- a/Memory-Based-Parameter-Adaption.html +++ b/Memory-Based-Parameter-Adaption.html @@ -159,7 +159,7 @@ @@ -337,9 +337,9 @@

    Related Posts

  • - - Hints for Computer System Design - 07 Jan 2022 + + Toolformer - Language Models Can Teach Themselves to Use Tools + 10 Feb 2023

  • diff --git a/Meta-Learning-Update-Rules-for-Unsupervised-Representation-Learning.html b/Meta-Learning-Update-Rules-for-Unsupervised-Representation-Learning.html index 432b6a1a..a126e8c7 100644 --- a/Meta-Learning-Update-Rules-for-Unsupervised-Representation-Learning.html +++ b/Meta-Learning-Update-Rules-for-Unsupervised-Representation-Learning.html @@ -159,7 +159,7 @@ @@ -313,9 +313,9 @@

    Related Posts

  • - - Hints for Computer System Design - 07 Jan 2022 + + Toolformer - Language Models Can Teach Themselves to Use Tools + 10 Feb 2023

  • diff --git a/Meta-Reinforcement-Learning-of-Structured-Exploration-Strategies.html b/Meta-Reinforcement-Learning-of-Structured-Exploration-Strategies.html index e18c665f..9d50c46a 100644 --- a/Meta-Reinforcement-Learning-of-Structured-Exploration-Strategies.html +++ b/Meta-Reinforcement-Learning-of-Structured-Exploration-Strategies.html @@ -159,7 +159,7 @@ @@ -283,9 +283,9 @@

    Related Posts

  • - - Hints for Computer System Design - 07 Jan 2022 + + Toolformer - Language Models Can Teach Themselves to Use Tools + 10 Feb 2023

  • diff --git a/Model-Primitive-Hierarchical-Lifelong-Reinforcement-Learning.html b/Model-Primitive-Hierarchical-Lifelong-Reinforcement-Learning.html index 559f8a9d..15a2c127 100644 --- a/Model-Primitive-Hierarchical-Lifelong-Reinforcement-Learning.html +++ b/Model-Primitive-Hierarchical-Lifelong-Reinforcement-Learning.html @@ -159,7 +159,7 @@ @@ -355,9 +355,9 @@

    Related Posts

  • - - Hints for Computer System Design - 07 Jan 2022 + + Toolformer - Language Models Can Teach Themselves to Use Tools + 10 Feb 2023

  • diff --git a/Modular-meta-learning.html b/Modular-meta-learning.html index 8ac6ac07..da24f581 100644 --- a/Modular-meta-learning.html +++ b/Modular-meta-learning.html @@ -159,7 +159,7 @@ @@ -387,9 +387,9 @@

    Related Posts

  • - - Hints for Computer System Design - 07 Jan 2022 + + Toolformer - Language Models Can Teach Themselves to Use Tools + 10 Feb 2023

  • diff --git a/Multiple-Model-Based-Reinforcement-Learning.html b/Multiple-Model-Based-Reinforcement-Learning.html index fadcdae7..19ff1ef3 100644 --- a/Multiple-Model-Based-Reinforcement-Learning.html +++ b/Multiple-Model-Based-Reinforcement-Learning.html @@ -159,7 +159,7 @@ @@ -247,9 +247,9 @@

    Related Posts

  • - - Hints for Computer System Design - 07 Jan 2022 + + Toolformer - Language Models Can Teach Themselves to Use Tools + 10 Feb 2023

  • diff --git a/Net2Net-Accelerating-Learning-via-Knowledge-Transfer.html b/Net2Net-Accelerating-Learning-via-Knowledge-Transfer.html index e6962305..c2f9d4e9 100644 --- a/Net2Net-Accelerating-Learning-via-Knowledge-Transfer.html +++ b/Net2Net-Accelerating-Learning-via-Knowledge-Transfer.html @@ -159,7 +159,7 @@ @@ -260,9 +260,9 @@

    Related Posts

  • - - Hints for Computer System Design - 07 Jan 2022 + + Toolformer - Language Models Can Teach Themselves to Use Tools + 10 Feb 2023

  • diff --git a/Network-Motifs-Simple-Building-Blocks-of-Complex-Networks.html b/Network-Motifs-Simple-Building-Blocks-of-Complex-Networks.html index fe70e52b..7f8a6662 100644 --- a/Network-Motifs-Simple-Building-Blocks-of-Complex-Networks.html +++ b/Network-Motifs-Simple-Building-Blocks-of-Complex-Networks.html @@ -159,7 +159,7 @@ @@ -225,9 +225,9 @@

    Related Posts

  • - - Hints for Computer System Design - 07 Jan 2022 + + Toolformer - Language Models Can Teach Themselves to Use Tools + 10 Feb 2023

  • diff --git a/Network-Randomization-A-Simple-Technique-for-Generalization-in-Deep-Reinforcement-Learning.html b/Network-Randomization-A-Simple-Technique-for-Generalization-in-Deep-Reinforcement-Learning.html index 27c5d6d3..afa67553 100644 --- a/Network-Randomization-A-Simple-Technique-for-Generalization-in-Deep-Reinforcement-Learning.html +++ b/Network-Randomization-A-Simple-Technique-for-Generalization-in-Deep-Reinforcement-Learning.html @@ -159,7 +159,7 @@ @@ -269,9 +269,9 @@

    Related Posts

  • - - Hints for Computer System Design - 07 Jan 2022 + + Toolformer - Language Models Can Teach Themselves to Use Tools + 10 Feb 2023

  • diff --git a/Neural-Message-Passing-for-Quantum-Chemistry.html b/Neural-Message-Passing-for-Quantum-Chemistry.html index 602aacef..44512089 100644 --- a/Neural-Message-Passing-for-Quantum-Chemistry.html +++ b/Neural-Message-Passing-for-Quantum-Chemistry.html @@ -159,7 +159,7 @@ @@ -353,9 +353,9 @@

    Related Posts

  • - - Hints for Computer System Design - 07 Jan 2022 + + Toolformer - Language Models Can Teach Themselves to Use Tools + 10 Feb 2023

  • diff --git a/Neural-Module-Networks.html b/Neural-Module-Networks.html index 2e5e190b..8132f6ed 100644 --- a/Neural-Module-Networks.html +++ b/Neural-Module-Networks.html @@ -159,7 +159,7 @@ @@ -265,9 +265,9 @@

    Related Posts

  • - - Hints for Computer System Design - 07 Jan 2022 + + Toolformer - Language Models Can Teach Themselves to Use Tools + 10 Feb 2023

  • diff --git a/Neural-Relational-Inference-for-Interacting-Systems.html b/Neural-Relational-Inference-for-Interacting-Systems.html index e614b4cb..9c0e0cc8 100644 --- a/Neural-Relational-Inference-for-Interacting-Systems.html +++ b/Neural-Relational-Inference-for-Interacting-Systems.html @@ -159,7 +159,7 @@ @@ -288,9 +288,9 @@

    Related Posts

  • - - Hints for Computer System Design - 07 Jan 2022 + + Toolformer - Language Models Can Teach Themselves to Use Tools + 10 Feb 2023

  • diff --git a/Observational-Overfitting-in-Reinforcement-Learning.html b/Observational-Overfitting-in-Reinforcement-Learning.html index 327d713a..9ecc42c9 100644 --- a/Observational-Overfitting-in-Reinforcement-Learning.html +++ b/Observational-Overfitting-in-Reinforcement-Learning.html @@ -159,7 +159,7 @@ @@ -325,9 +325,9 @@

    Related Posts

  • - - Hints for Computer System Design - 07 Jan 2022 + + Toolformer - Language Models Can Teach Themselves to Use Tools + 10 Feb 2023

  • diff --git a/On-the-Difficulty-of-Warm-Starting-Neural-Network-Training.html b/On-the-Difficulty-of-Warm-Starting-Neural-Network-Training.html index 9067c9a1..95fe0f48 100644 --- a/On-the-Difficulty-of-Warm-Starting-Neural-Network-Training.html +++ b/On-the-Difficulty-of-Warm-Starting-Neural-Network-Training.html @@ -159,7 +159,7 @@ @@ -327,9 +327,9 @@

    Related Posts

  • - - Hints for Computer System Design - 07 Jan 2022 + + Toolformer - Language Models Can Teach Themselves to Use Tools + 10 Feb 2023

  • diff --git a/One-Model-To-Learn-Them-All.html b/One-Model-To-Learn-Them-All.html index 69c1a892..f819b729 100644 --- a/One-Model-To-Learn-Them-All.html +++ b/One-Model-To-Learn-Them-All.html @@ -159,7 +159,7 @@ @@ -368,9 +368,9 @@

    Related Posts

  • - - Hints for Computer System Design - 07 Jan 2022 + + Toolformer - Language Models Can Teach Themselves to Use Tools + 10 Feb 2023

  • diff --git a/One-Solution-is-Not-All-You-Need-Few-Shot-Extrapolation-via-Structured-MaxEnt-RL.html b/One-Solution-is-Not-All-You-Need-Few-Shot-Extrapolation-via-Structured-MaxEnt-RL.html index 9de6b7c7..b9912531 100644 --- a/One-Solution-is-Not-All-You-Need-Few-Shot-Extrapolation-via-Structured-MaxEnt-RL.html +++ b/One-Solution-is-Not-All-You-Need-Few-Shot-Extrapolation-via-Structured-MaxEnt-RL.html @@ -159,7 +159,7 @@ @@ -310,9 +310,9 @@

    Related Posts

  • - - Hints for Computer System Design - 07 Jan 2022 + + Toolformer - Language Models Can Teach Themselves to Use Tools + 10 Feb 2023

  • diff --git a/One-shot-Learning-with-Memory-Augmented-Neural-Networks.html b/One-shot-Learning-with-Memory-Augmented-Neural-Networks.html index 9a0561df..294e295c 100644 --- a/One-shot-Learning-with-Memory-Augmented-Neural-Networks.html +++ b/One-shot-Learning-with-Memory-Augmented-Neural-Networks.html @@ -159,7 +159,7 @@ @@ -312,9 +312,9 @@

    Related Posts

  • - - Hints for Computer System Design - 07 Jan 2022 + + Toolformer - Language Models Can Teach Themselves to Use Tools + 10 Feb 2023

  • diff --git a/Outrageously-Large-Neural-Networks-The-Sparsely-Gated-Mixture-of-Experts-Layer.html b/Outrageously-Large-Neural-Networks-The-Sparsely-Gated-Mixture-of-Experts-Layer.html index 8e6ff74a..ef5bdf72 100644 --- a/Outrageously-Large-Neural-Networks-The-Sparsely-Gated-Mixture-of-Experts-Layer.html +++ b/Outrageously-Large-Neural-Networks-The-Sparsely-Gated-Mixture-of-Experts-Layer.html @@ -159,7 +159,7 @@ @@ -334,9 +334,9 @@

    Related Posts

  • - - Hints for Computer System Design - 07 Jan 2022 + + Toolformer - Language Models Can Teach Themselves to Use Tools + 10 Feb 2023

  • diff --git a/PHYRE-A-New-Benchmark-for-Physical-Reasoning.html b/PHYRE-A-New-Benchmark-for-Physical-Reasoning.html index 0aec0e60..fe6953f3 100644 --- a/PHYRE-A-New-Benchmark-for-Physical-Reasoning.html +++ b/PHYRE-A-New-Benchmark-for-Physical-Reasoning.html @@ -159,7 +159,7 @@ @@ -355,9 +355,9 @@

    Related Posts

  • - - Hints for Computer System Design - 07 Jan 2022 + + Toolformer - Language Models Can Teach Themselves to Use Tools + 10 Feb 2023

  • diff --git a/PTE-Predictive-Text-Embedding-through-Large-scale-Heterogeneous-Text-Networks.html b/PTE-Predictive-Text-Embedding-through-Large-scale-Heterogeneous-Text-Networks.html index 62820c48..47841bc7 100644 --- a/PTE-Predictive-Text-Embedding-through-Large-scale-Heterogeneous-Text-Networks.html +++ b/PTE-Predictive-Text-Embedding-through-Large-scale-Heterogeneous-Text-Networks.html @@ -159,7 +159,7 @@ @@ -288,9 +288,9 @@

    Related Posts

  • - - Hints for Computer System Design - 07 Jan 2022 + + Toolformer - Language Models Can Teach Themselves to Use Tools + 10 Feb 2023

  • diff --git a/Poincare-Embeddings-for-Learning-Hierarchical-Representations.html b/Poincare-Embeddings-for-Learning-Hierarchical-Representations.html index 7e96524e..6e040b44 100644 --- a/Poincare-Embeddings-for-Learning-Hierarchical-Representations.html +++ b/Poincare-Embeddings-for-Learning-Hierarchical-Representations.html @@ -159,7 +159,7 @@ @@ -321,9 +321,9 @@

    Related Posts

  • - - Hints for Computer System Design - 07 Jan 2022 + + Toolformer - Language Models Can Teach Themselves to Use Tools + 10 Feb 2023

  • diff --git a/Pointer-Networks.html b/Pointer-Networks.html index 4c7fcd53..fa354a43 100644 --- a/Pointer-Networks.html +++ b/Pointer-Networks.html @@ -159,7 +159,7 @@ @@ -255,9 +255,9 @@

    Related Posts

  • - - Hints for Computer System Design - 07 Jan 2022 + + Toolformer - Language Models Can Teach Themselves to Use Tools + 10 Feb 2023

  • diff --git a/Practical-Lessons-from-Predicting-Clicks-on-Ads-at-Facebook.html b/Practical-Lessons-from-Predicting-Clicks-on-Ads-at-Facebook.html index df43e04b..d5736553 100644 --- a/Practical-Lessons-from-Predicting-Clicks-on-Ads-at-Facebook.html +++ b/Practical-Lessons-from-Predicting-Clicks-on-Ads-at-Facebook.html @@ -159,7 +159,7 @@ @@ -371,9 +371,9 @@

    Related Posts

  • - - Hints for Computer System Design - 07 Jan 2022 + + Toolformer - Language Models Can Teach Themselves to Use Tools + 10 Feb 2023

  • diff --git a/Pre-training-Graph-Neural-Networks-with-Kernels.html b/Pre-training-Graph-Neural-Networks-with-Kernels.html index 79454862..46b8be1d 100644 --- a/Pre-training-Graph-Neural-Networks-with-Kernels.html +++ b/Pre-training-Graph-Neural-Networks-with-Kernels.html @@ -159,7 +159,7 @@ @@ -264,9 +264,9 @@

    Related Posts

  • - - Hints for Computer System Design - 07 Jan 2022 + + Toolformer - Language Models Can Teach Themselves to Use Tools + 10 Feb 2023

  • diff --git a/Principled-Detection-of-Out-of-Distribution-Examples-in-Neural-Networks.html b/Principled-Detection-of-Out-of-Distribution-Examples-in-Neural-Networks.html index 014f7123..649c1757 100644 --- a/Principled-Detection-of-Out-of-Distribution-Examples-in-Neural-Networks.html +++ b/Principled-Detection-of-Out-of-Distribution-Examples-in-Neural-Networks.html @@ -159,7 +159,7 @@ @@ -311,9 +311,9 @@

    Related Posts

  • - - Hints for Computer System Design - 07 Jan 2022 + + Toolformer - Language Models Can Teach Themselves to Use Tools + 10 Feb 2023

  • diff --git a/Quantifying-Generalization-in-Reinforcement-Learning.html b/Quantifying-Generalization-in-Reinforcement-Learning.html index 159e39ad..24472777 100644 --- a/Quantifying-Generalization-in-Reinforcement-Learning.html +++ b/Quantifying-Generalization-in-Reinforcement-Learning.html @@ -159,7 +159,7 @@ @@ -319,9 +319,9 @@

    Related Posts

  • - - Hints for Computer System Design - 07 Jan 2022 + + Toolformer - Language Models Can Teach Themselves to Use Tools + 10 Feb 2023

  • diff --git a/R-NET-Machine-Reading-Comprehension-with-Self-matching-Networks.html b/R-NET-Machine-Reading-Comprehension-with-Self-matching-Networks.html index 72ad4c35..a875ced3 100644 --- a/R-NET-Machine-Reading-Comprehension-with-Self-matching-Networks.html +++ b/R-NET-Machine-Reading-Comprehension-with-Self-matching-Networks.html @@ -159,7 +159,7 @@ @@ -281,9 +281,9 @@

    Related Posts

  • - - Hints for Computer System Design - 07 Jan 2022 + + Toolformer - Language Models Can Teach Themselves to Use Tools + 10 Feb 2023

  • diff --git a/Rapid-Learning-or-Feature-Reuse-Towards-Understanding-the-Effectiveness-of-MAML.html b/Rapid-Learning-or-Feature-Reuse-Towards-Understanding-the-Effectiveness-of-MAML.html index 90a17257..57a1c51c 100644 --- a/Rapid-Learning-or-Feature-Reuse-Towards-Understanding-the-Effectiveness-of-MAML.html +++ b/Rapid-Learning-or-Feature-Reuse-Towards-Understanding-the-Effectiveness-of-MAML.html @@ -159,7 +159,7 @@ @@ -332,9 +332,9 @@

    Related Posts

  • - - Hints for Computer System Design - 07 Jan 2022 + + Toolformer - Language Models Can Teach Themselves to Use Tools + 10 Feb 2023

  • diff --git a/Reading-Wikipedia-to-Answer-Open-Domain-Questions.html b/Reading-Wikipedia-to-Answer-Open-Domain-Questions.html index 33a9c218..f1dc2bd1 100644 --- a/Reading-Wikipedia-to-Answer-Open-Domain-Questions.html +++ b/Reading-Wikipedia-to-Answer-Open-Domain-Questions.html @@ -159,7 +159,7 @@ @@ -265,9 +265,9 @@

    Related Posts

  • - - Hints for Computer System Design - 07 Jan 2022 + + Toolformer - Language Models Can Teach Themselves to Use Tools + 10 Feb 2023

  • diff --git a/ReasoNet-Learning-to-Stop-Reading-in-Machine-Comprehension.html b/ReasoNet-Learning-to-Stop-Reading-in-Machine-Comprehension.html index 6f80ebbb..4fe04e8c 100644 --- a/ReasoNet-Learning-to-Stop-Reading-in-Machine-Comprehension.html +++ b/ReasoNet-Learning-to-Stop-Reading-in-Machine-Comprehension.html @@ -159,7 +159,7 @@ @@ -320,9 +320,9 @@

    Related Posts

  • - - Hints for Computer System Design - 07 Jan 2022 + + Toolformer - Language Models Can Teach Themselves to Use Tools + 10 Feb 2023

  • diff --git a/Refining-Source-Representations-with-Relation-Networks-for-Neural-Machine-Translation.html b/Refining-Source-Representations-with-Relation-Networks-for-Neural-Machine-Translation.html index 99e72c2f..06de16da 100644 --- a/Refining-Source-Representations-with-Relation-Networks-for-Neural-Machine-Translation.html +++ b/Refining-Source-Representations-with-Relation-Networks-for-Neural-Machine-Translation.html @@ -159,7 +159,7 @@ @@ -276,9 +276,9 @@

    Related Posts

  • - - Hints for Computer System Design - 07 Jan 2022 + + Toolformer - Language Models Can Teach Themselves to Use Tools + 10 Feb 2023

  • diff --git a/Relational-Reinforcement-Learning.html b/Relational-Reinforcement-Learning.html index 84a6dd06..786ce34c 100644 --- a/Relational-Reinforcement-Learning.html +++ b/Relational-Reinforcement-Learning.html @@ -159,7 +159,7 @@ @@ -312,9 +312,9 @@

    Related Posts

  • - - Hints for Computer System Design - 07 Jan 2022 + + Toolformer - Language Models Can Teach Themselves to Use Tools + 10 Feb 2023

  • diff --git a/Remembering-for-the-Right-Reasons-Explanations-Reduce-Catastrophic-Forgetting.html b/Remembering-for-the-Right-Reasons-Explanations-Reduce-Catastrophic-Forgetting.html index d2f5ddc2..a51729c6 100644 --- a/Remembering-for-the-Right-Reasons-Explanations-Reduce-Catastrophic-Forgetting.html +++ b/Remembering-for-the-Right-Reasons-Explanations-Reduce-Catastrophic-Forgetting.html @@ -159,7 +159,7 @@ @@ -254,9 +254,9 @@

    Related Posts

  • - - Hints for Computer System Design - 07 Jan 2022 + + Toolformer - Language Models Can Teach Themselves to Use Tools + 10 Feb 2023

  • diff --git a/Representation-Tradeoffs-for-Hyperbolic-Embeddings.html b/Representation-Tradeoffs-for-Hyperbolic-Embeddings.html index ce1e5d2a..4b5e40c9 100644 --- a/Representation-Tradeoffs-for-Hyperbolic-Embeddings.html +++ b/Representation-Tradeoffs-for-Hyperbolic-Embeddings.html @@ -159,7 +159,7 @@ @@ -372,9 +372,9 @@

    Related Posts

  • - - Hints for Computer System Design - 07 Jan 2022 + + Toolformer - Language Models Can Teach Themselves to Use Tools + 10 Feb 2023

  • diff --git a/Revisiting-Fundamentals-of-Experience-Replay.html b/Revisiting-Fundamentals-of-Experience-Replay.html index ce323de3..e0ef9d80 100644 --- a/Revisiting-Fundamentals-of-Experience-Replay.html +++ b/Revisiting-Fundamentals-of-Experience-Replay.html @@ -159,7 +159,7 @@ @@ -321,9 +321,9 @@

    Related Posts

  • - - Hints for Computer System Design - 07 Jan 2022 + + Toolformer - Language Models Can Teach Themselves to Use Tools + 10 Feb 2023

  • diff --git a/Revisiting-Semi-Supervised-Learning-with-Graph-Embeddings.html b/Revisiting-Semi-Supervised-Learning-with-Graph-Embeddings.html index 283721b6..15e86184 100644 --- a/Revisiting-Semi-Supervised-Learning-with-Graph-Embeddings.html +++ b/Revisiting-Semi-Supervised-Learning-with-Graph-Embeddings.html @@ -159,7 +159,7 @@ @@ -277,9 +277,9 @@

    Related Posts

  • - - Hints for Computer System Design - 07 Jan 2022 + + Toolformer - Language Models Can Teach Themselves to Use Tools + 10 Feb 2023

  • diff --git a/Searching-for-Build-Debt-Experiences-Managing-Technical-Debt-at-Google.html b/Searching-for-Build-Debt-Experiences-Managing-Technical-Debt-at-Google.html index ddac935c..afe366ec 100644 --- a/Searching-for-Build-Debt-Experiences-Managing-Technical-Debt-at-Google.html +++ b/Searching-for-Build-Debt-Experiences-Managing-Technical-Debt-at-Google.html @@ -159,7 +159,7 @@ @@ -331,9 +331,9 @@

    Related Posts

  • - - Hints for Computer System Design - 07 Jan 2022 + + Toolformer - Language Models Can Teach Themselves to Use Tools + 10 Feb 2023

  • diff --git a/Set-Transformer-A-Framework-for-Attention-based-Permutation-Invariant-Neural-Networks.html b/Set-Transformer-A-Framework-for-Attention-based-Permutation-Invariant-Neural-Networks.html index 5ff6e317..20676569 100644 --- a/Set-Transformer-A-Framework-for-Attention-based-Permutation-Invariant-Neural-Networks.html +++ b/Set-Transformer-A-Framework-for-Attention-based-Permutation-Invariant-Neural-Networks.html @@ -159,7 +159,7 @@ @@ -294,9 +294,9 @@

    Related Posts

  • - - Hints for Computer System Design - 07 Jan 2022 + + Toolformer - Language Models Can Teach Themselves to Use Tools + 10 Feb 2023

  • diff --git a/Simple-Baseline-for-Visual-Question-Answering.html b/Simple-Baseline-for-Visual-Question-Answering.html index 9046e8d4..0c3942e1 100644 --- a/Simple-Baseline-for-Visual-Question-Answering.html +++ b/Simple-Baseline-for-Visual-Question-Answering.html @@ -159,7 +159,7 @@ @@ -225,9 +225,9 @@

    Related Posts

  • - - Hints for Computer System Design - 07 Jan 2022 + + Toolformer - Language Models Can Teach Themselves to Use Tools + 10 Feb 2023

  • diff --git a/Smooth-Loss-Functions-for-Deep-Top-k-Classification.html b/Smooth-Loss-Functions-for-Deep-Top-k-Classification.html index 5ae12ff1..8897f48c 100644 --- a/Smooth-Loss-Functions-for-Deep-Top-k-Classification.html +++ b/Smooth-Loss-Functions-for-Deep-Top-k-Classification.html @@ -159,7 +159,7 @@ @@ -308,9 +308,9 @@

    Related Posts

  • - - Hints for Computer System Design - 07 Jan 2022 + + Toolformer - Language Models Can Teach Themselves to Use Tools + 10 Feb 2023

  • diff --git a/StarSpace-Embed-All-The-Things.html b/StarSpace-Embed-All-The-Things.html index 926be811..3bbfee59 100644 --- a/StarSpace-Embed-All-The-Things.html +++ b/StarSpace-Embed-All-The-Things.html @@ -159,7 +159,7 @@ @@ -248,9 +248,9 @@

    Related Posts

  • - - Hints for Computer System Design - 07 Jan 2022 + + Toolformer - Language Models Can Teach Themselves to Use Tools + 10 Feb 2023

  • diff --git a/Stylistic-Transfer-in-Natural-Language-Generation-Systems-Using-Recurrent-Neural-Networks.html b/Stylistic-Transfer-in-Natural-Language-Generation-Systems-Using-Recurrent-Neural-Networks.html index 84713dcd..2465c4c9 100644 --- a/Stylistic-Transfer-in-Natural-Language-Generation-Systems-Using-Recurrent-Neural-Networks.html +++ b/Stylistic-Transfer-in-Natural-Language-Generation-Systems-Using-Recurrent-Neural-Networks.html @@ -159,7 +159,7 @@ @@ -239,9 +239,9 @@

    Related Posts

  • - - Hints for Computer System Design - 07 Jan 2022 + + Toolformer - Language Models Can Teach Themselves to Use Tools + 10 Feb 2023

  • diff --git a/Superposition-of-many-models-into-one.html b/Superposition-of-many-models-into-one.html index 7e8ee5de..8339a9bc 100644 --- a/Superposition-of-many-models-into-one.html +++ b/Superposition-of-many-models-into-one.html @@ -159,7 +159,7 @@ @@ -376,9 +376,9 @@

    Related Posts

  • - - Hints for Computer System Design - 07 Jan 2022 + + Toolformer - Language Models Can Teach Themselves to Use Tools + 10 Feb 2023

  • diff --git a/Supervised-Contrastive-Learning.html b/Supervised-Contrastive-Learning.html index 9259a134..88500268 100644 --- a/Supervised-Contrastive-Learning.html +++ b/Supervised-Contrastive-Learning.html @@ -159,7 +159,7 @@ @@ -301,9 +301,9 @@

    Related Posts

  • - - Hints for Computer System Design - 07 Jan 2022 + + Toolformer - Language Models Can Teach Themselves to Use Tools + 10 Feb 2023

  • diff --git a/Swish-A-self-gated-activation-function.html b/Swish-A-self-gated-activation-function.html index 13812477..56e10b63 100644 --- a/Swish-A-self-gated-activation-function.html +++ b/Swish-A-self-gated-activation-function.html @@ -159,7 +159,7 @@ @@ -236,9 +236,9 @@

    Related Posts

  • - - Hints for Computer System Design - 07 Jan 2022 + + Toolformer - Language Models Can Teach Themselves to Use Tools + 10 Feb 2023

  • diff --git a/Synthesized-Policies-for-Transfer-and-Adaptation-across-Tasks-and-Environments.html b/Synthesized-Policies-for-Transfer-and-Adaptation-across-Tasks-and-Environments.html index 6af90235..8ea213a9 100644 --- a/Synthesized-Policies-for-Transfer-and-Adaptation-across-Tasks-and-Environments.html +++ b/Synthesized-Policies-for-Transfer-and-Adaptation-across-Tasks-and-Environments.html @@ -159,7 +159,7 @@ @@ -383,9 +383,9 @@

    Related Posts

  • - - Hints for Computer System Design - 07 Jan 2022 + + Toolformer - Language Models Can Teach Themselves to Use Tools + 10 Feb 2023

  • diff --git a/TASKNORM-Rethinking-Batch-Normalization-for-Meta-Learning.html b/TASKNORM-Rethinking-Batch-Normalization-for-Meta-Learning.html index 94095cff..f33257bc 100644 --- a/TASKNORM-Rethinking-Batch-Normalization-for-Meta-Learning.html +++ b/TASKNORM-Rethinking-Batch-Normalization-for-Meta-Learning.html @@ -159,7 +159,7 @@ @@ -359,9 +359,9 @@

    Related Posts

  • - - Hints for Computer System Design - 07 Jan 2022 + + Toolformer - Language Models Can Teach Themselves to Use Tools + 10 Feb 2023

  • diff --git a/Task-Oriented-Query-Reformulation-with-Reinforcement-Learning.html b/Task-Oriented-Query-Reformulation-with-Reinforcement-Learning.html index f1e78ae0..45162c91 100644 --- a/Task-Oriented-Query-Reformulation-with-Reinforcement-Learning.html +++ b/Task-Oriented-Query-Reformulation-with-Reinforcement-Learning.html @@ -159,7 +159,7 @@ @@ -305,9 +305,9 @@

    Related Posts

  • - - Hints for Computer System Design - 07 Jan 2022 + + Toolformer - Language Models Can Teach Themselves to Use Tools + 10 Feb 2023

  • diff --git a/The-Lottery-Ticket-Hypothesis-Training-Pruned-Neural-Networks.html b/The-Lottery-Ticket-Hypothesis-Training-Pruned-Neural-Networks.html index c21704af..29f8b3af 100644 --- a/The-Lottery-Ticket-Hypothesis-Training-Pruned-Neural-Networks.html +++ b/The-Lottery-Ticket-Hypothesis-Training-Pruned-Neural-Networks.html @@ -159,7 +159,7 @@ @@ -263,9 +263,9 @@

    Related Posts

  • - - Hints for Computer System Design - 07 Jan 2022 + + Toolformer - Language Models Can Teach Themselves to Use Tools + 10 Feb 2023

  • diff --git a/The-Tail-at-Scale.html b/The-Tail-at-Scale.html index bdf2ebd7..9870e301 100644 --- a/The-Tail-at-Scale.html +++ b/The-Tail-at-Scale.html @@ -159,7 +159,7 @@ @@ -375,9 +375,9 @@

    Related Posts

  • - - Hints for Computer System Design - 07 Jan 2022 + + Toolformer - Language Models Can Teach Themselves to Use Tools + 10 Feb 2023

  • diff --git a/To-Tune-or-Not-to-Tune-Adapting-Pretrained-Representations-to-Diverse-Tasks.html b/To-Tune-or-Not-to-Tune-Adapting-Pretrained-Representations-to-Diverse-Tasks.html index 07e95b64..30b12d0d 100644 --- a/To-Tune-or-Not-to-Tune-Adapting-Pretrained-Representations-to-Diverse-Tasks.html +++ b/To-Tune-or-Not-to-Tune-Adapting-Pretrained-Representations-to-Diverse-Tasks.html @@ -159,7 +159,7 @@ @@ -337,9 +337,9 @@

    Related Posts

  • - - Hints for Computer System Design - 07 Jan 2022 + + Toolformer - Language Models Can Teach Themselves to Use Tools + 10 Feb 2023

  • diff --git a/Toolformer-Language-Models-Can-Teach-Themselves-to-Use-Tools.html b/Toolformer-Language-Models-Can-Teach-Themselves-to-Use-Tools.html new file mode 100644 index 00000000..7efa3fed --- /dev/null +++ b/Toolformer-Language-Models-Can-Teach-Themselves-to-Use-Tools.html @@ -0,0 +1,488 @@ + + + + + + + + + + + + + + + + + Toolformer - Language Models Can Teach Themselves to Use Tools · Papers I Read + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
    +
    +
    +

    + Papers I Read + Notes and Summaries +

    +
    +
    + +
    +
    +

    Toolformer - Language Models Can Teach Themselves to Use Tools

    + + +

    Introduction

    + +
      +
    • +

      The paper presents Toolformer, a language model that uses simple APIs to use external tools (calculator, QA system, search engine, translation system, and calendar).

      +
    • +
    • +

      Link to the paper

      +
    • +
    + +

    Approach

    + +
      +
    • +

      Starting with a language model, M, the goal is to enable the language model to use tools by invoking API calls.

      +
    • +
    • +

      An API call is denoted by the tuple $c = (\mathit{api\_name}, \mathit{api\_input})$. It can be linearized as $e(c) = [\mathit{api\_name}(\mathit{api\_input})]$ or as $e(c, r) = [\mathit{api\_name}(\mathit{api\_input}) -> r]$, where $r$ denotes the result of the API call.

      +
    • +
    • +

      The given dataset of plain text, $C$, is converted into a dataset $C*$ augmented with the API calls using a three-step process.

      +
    • +
    • +

      In the first step, a position ($i$) and API call candidates (for the position $i$) are sampled.

      + +
        +
      • +

        Positions are sampled by (i) computing the probability that M assigns to starting an API call for each position and (ii) retaining the top-$k$ positions with a probability greater than a threshold value.

        +
      • +
      • +

        For each of the sampled positions (say $i$), API calls are sampled by concatenating a prompt to the tokens up to index $i$ and sampling from the model M. Examples that do not generate the “end of the API” token (i.e., “]”) are discarded.

        +
      • +
      +
    • +
    • +

      In the second step, the API calls are executed to obtain response $r$ (text sequence).

      + +
        +
      • API calls are filtered using the following criterion: if providing M with both the input and the output of the API makes it easier for M to predict future tokens, compared to not using the API call at all or just using the input to the API, then the API call is helpful for M, and the example should be retained.
      • +
      +
    • +
    • +

      In the last step, the remaining API calls are merged to obtain the augmented dataset $C*$ that is used for finetuning M.

      +
    • +
    • +

      Note that $C*$ contains $C$, so M is finetuned on the original dataset and examples where a tool is helpful.

      +
    • +
    • +

      During inference, the model is used for decoding in the usual way. Decoding is paused when the model produces the “->” token, and the corresponding API is called to obtain the response. Decoding (using the model) then resumes with the API response appended to the decoded text.

      +
    • +
    + +

    Tools

    + +
      +
    • +

      There are two constraints on the tools: (i) their input and output should be expressible as text, and (ii) a few demonstrations of their use can be obtained. The second constraint means that the tool should be usable or accessible.

      +
    • +
    • +

      The paper considered the following tools: a question-answering system, a Wikipedia search engine, a calculator, a calendar, and a machine translation system. Of these, only the calculator and calendar are non-neural network tools.

      +
    • +
    + +

    Experiments

    + +
      +
    • +

      A subset of CCNet is used as the language modeling dataset.

      +
    • +
    • +

      GPT-J is used as the language model.

      +
    • +
    • +

      For finetuning, the batch size is 128, the learning rate is 1e-5, and a linear warmup for the first 10% of training is used.

      +
    • +
    • +

      The following models are compared:

      + +
        +
      • +

        GPT-J: Regular GPT-J model without any finetuning.

        +
      • +
      • +

        GPT-J + CC: GPT-J finetuned on $C$ without any API calls.

        +
      • +
      • +

        Toolformer, i.e. GPT-J finetuned on $C*$.

        +
      • +
      • +

        Toolformer with API calls disabled during decoding.

        +
      • +
      • +

        OPT 66B

        +
      • +
      • +

        GPT-3

        +
      • +
      +
    • +
    • +

      The models are evaluated in the prompted zero-shot setup, where models are instructed to solve a task without any in-context examples.

      +
    • +
    • +

      One difference from the standard greedy decoding is that the API call is used whenever it is one of the top-10 most likely next tokens. This is done to increase the use of API calls.

      +
    • +
    • +

      Evaluation Tasks

      + +
        +
      • +

        SQuAD, GoogleRE, and T-REx subsets of the LAMA benchmark where the model has to complete a short statement with a missing fact.

        + +
          +
        • +

          Since LAMA questions are based on Wikipedia, Toolformer isn’t allowed to use Wikipedia search.

          +
        • +
        • +

          The evaluation criterion is to check if the correct word is among the first five words predicted by the model.

          +
        • +
        • +

          Toolformer uses the question-answering tool for most cases, outperforming all the baselines.

          +
        • +
        +
      • +
      • +

        Math Dataset

        + +
          +
        • +

          ASDiv, SVAMP, and MAWPS benchmarks.

          +
        • +
        • +

          The first number predicted by the model is considered to be the output.

          +
        • +
        • +

          Toolformer uses the calculator tool for most cases, thereby outperforming all the baselines.

          +
        • +
        +
      • +
      • +

        Question Answering

        + +
          +
        • +

          Web Questions, Natural Questions, and TriviaQA datasets.

          +
        • +
        • +

          The evaluation criterion is to check if the correct word is among the first 20 words predicted by the model.

          +
        • +
        • +

          The question-answering tool is disabled for this setup.

          +
        • +
        • +

          Toolformer uses the Wikipedia tool for most cases, thereby outperforming all the baselines other than the much larger GPT-3 model.

          +
        • +
        +
      • +
      • +

        Multilingual Question Answering

        + +
          +
        • +

          MLQA benchmark.

          +
        • +
        • +

          The evaluation criterion is to check if the correct word is among the first ten words predicted by the model.

          +
        • +
        • +

          Toolformer uses the translation tool for most of the questions, with questions in Hindi being an exception.

          +
        • +
        • +

          However, Toolformer does not consistently outperform the GPT-J baseline, likely because, for some languages, finetuning on CCNet could hurt performance.

          +
        • +
        +
      • +
      • +

        Temporal Datasets

        + +
          +
        • +

          TEMPLAMA (cloze style queries where the answer changes with time) and DATESET (dataset generated through a series of templates and populated with random dates/durations).

          +
        • +
        • +

          While Toolformer outperforms the baselines on both datasets, it relies on the Wikipedia search and question-answering tools (and not the calendar tool) for the TEMPLAMA dataset. On the DATESET dataset, it uses the calendar tool in the majority of cases.

          +
        • +
        +
      • +
      • +

        Language Modeling

        + +
          +
        • +

          WikiText and a subset of 10,000 randomly selected documents from CCNet (not used during training of M).

          +
        • +
        • +

          Training on $C*$ does not increase perplexity (compared to training on $C$). In this experiment, the API calls are disabled during inference.

          +
        • +
        +
      • +
      +
    • +
    • +

      Varying the size of the underlying model shows that the ability to use tools emerges only at around 775M parameters.

      +
    • +
    + +

    Future Work

    + +
      +
    • +

      Extending Toolformer to chain the use of tools and use tools interactively.

      +
    • +
    • +

      In some cases, the use of tools is very sample-inefficient.

      +
    • +
    • +

      The decision to use a tool does not account for the cost of using the tool.

      +
    • +
    + +
    + + +
    +
    + + + + +
    + + + + + + + + diff --git a/Towards-a-Unified-Theory-of-State-Abstraction-for-MDPs.html b/Towards-a-Unified-Theory-of-State-Abstraction-for-MDPs.html index fc942447..1830005d 100644 --- a/Towards-a-Unified-Theory-of-State-Abstraction-for-MDPs.html +++ b/Towards-a-Unified-Theory-of-State-Abstraction-for-MDPs.html @@ -159,7 +159,7 @@ @@ -315,9 +315,9 @@

    Related Posts

  • - - Hints for Computer System Design - 07 Jan 2022 + + Toolformer - Language Models Can Teach Themselves to Use Tools + 10 Feb 2023

  • diff --git a/Towards-a-natural-benchmark-for-continual-learning.html b/Towards-a-natural-benchmark-for-continual-learning.html index 2fc57746..cf5e4619 100644 --- a/Towards-a-natural-benchmark-for-continual-learning.html +++ b/Towards-a-natural-benchmark-for-continual-learning.html @@ -159,7 +159,7 @@ @@ -242,9 +242,9 @@

    Related Posts

  • - - Hints for Computer System Design - 07 Jan 2022 + + Toolformer - Language Models Can Teach Themselves to Use Tools + 10 Feb 2023

  • diff --git a/TuckER-Tensor-Factorization-for-Knowledge-Graph-Completion.html b/TuckER-Tensor-Factorization-for-Knowledge-Graph-Completion.html index c281e16b..78a074ee 100644 --- a/TuckER-Tensor-Factorization-for-Knowledge-Graph-Completion.html +++ b/TuckER-Tensor-Factorization-for-Knowledge-Graph-Completion.html @@ -159,7 +159,7 @@ @@ -325,9 +325,9 @@

    Related Posts

  • - - Hints for Computer System Design - 07 Jan 2022 + + Toolformer - Language Models Can Teach Themselves to Use Tools + 10 Feb 2023

  • diff --git a/Two-Stage-Synthesis-Networks-for-Transfer-Learning-in-Machine-Comprehension.html b/Two-Stage-Synthesis-Networks-for-Transfer-Learning-in-Machine-Comprehension.html index 8b970550..3691585d 100644 --- a/Two-Stage-Synthesis-Networks-for-Transfer-Learning-in-Machine-Comprehension.html +++ b/Two-Stage-Synthesis-Networks-for-Transfer-Learning-in-Machine-Comprehension.html @@ -159,7 +159,7 @@ @@ -289,9 +289,9 @@

    Related Posts

  • - - Hints for Computer System Design - 07 Jan 2022 + + Toolformer - Language Models Can Teach Themselves to Use Tools + 10 Feb 2023

  • diff --git a/Two-Too-Simple-Adaptations-of-Word2Vec-for-Syntax-Problems.html b/Two-Too-Simple-Adaptations-of-Word2Vec-for-Syntax-Problems.html index 60e7199b..823e587a 100644 --- a/Two-Too-Simple-Adaptations-of-Word2Vec-for-Syntax-Problems.html +++ b/Two-Too-Simple-Adaptations-of-Word2Vec-for-Syntax-Problems.html @@ -159,7 +159,7 @@ @@ -200,9 +200,9 @@

    Related Posts

  • - - Hints for Computer System Design - 07 Jan 2022 + + Toolformer - Language Models Can Teach Themselves to Use Tools + 10 Feb 2023

  • diff --git a/Unsupervised-Learning-By-Predicting-Noise.html b/Unsupervised-Learning-By-Predicting-Noise.html index 2725b250..5a1ed510 100644 --- a/Unsupervised-Learning-By-Predicting-Noise.html +++ b/Unsupervised-Learning-By-Predicting-Noise.html @@ -159,7 +159,7 @@ @@ -338,9 +338,9 @@

    Related Posts

  • - - Hints for Computer System Design - 07 Jan 2022 + + Toolformer - Language Models Can Teach Themselves to Use Tools + 10 Feb 2023

  • diff --git a/VQA-Visual-Question-Answering.html b/VQA-Visual-Question-Answering.html index e254db92..142b9072 100644 --- a/VQA-Visual-Question-Answering.html +++ b/VQA-Visual-Question-Answering.html @@ -159,7 +159,7 @@ @@ -297,9 +297,9 @@

    Related Posts

  • - - Hints for Computer System Design - 07 Jan 2022 + + Toolformer - Language Models Can Teach Themselves to Use Tools + 10 Feb 2023

  • diff --git a/What-Does-Classifying-More-Than-10,000-Image-Categories-Tell-Us.html b/What-Does-Classifying-More-Than-10,000-Image-Categories-Tell-Us.html index e39f6c91..6325ec7d 100644 --- a/What-Does-Classifying-More-Than-10,000-Image-Categories-Tell-Us.html +++ b/What-Does-Classifying-More-Than-10,000-Image-Categories-Tell-Us.html @@ -159,7 +159,7 @@ @@ -235,9 +235,9 @@

    Related Posts

  • - - Hints for Computer System Design - 07 Jan 2022 + + Toolformer - Language Models Can Teach Themselves to Use Tools + 10 Feb 2023

  • diff --git a/When-Do-Curricula-Work.html b/When-Do-Curricula-Work.html index 373856ca..d23edcff 100644 --- a/When-Do-Curricula-Work.html +++ b/When-Do-Curricula-Work.html @@ -159,7 +159,7 @@ @@ -305,9 +305,9 @@

    Related Posts

  • - - Hints for Computer System Design - 07 Jan 2022 + + Toolformer - Language Models Can Teach Themselves to Use Tools + 10 Feb 2023

  • diff --git a/When-Recurrent-Models-Don-t-Need-To-Be-Recurrent.html b/When-Recurrent-Models-Don-t-Need-To-Be-Recurrent.html index 605faf51..23bd3ebd 100644 --- a/When-Recurrent-Models-Don-t-Need-To-Be-Recurrent.html +++ b/When-Recurrent-Models-Don-t-Need-To-Be-Recurrent.html @@ -159,7 +159,7 @@ @@ -253,9 +253,9 @@

    Related Posts

  • - - Hints for Computer System Design - 07 Jan 2022 + + Toolformer - Language Models Can Teach Themselves to Use Tools + 10 Feb 2023

  • diff --git a/When-to-use-parametric-models-in-reinforcement-learning.html b/When-to-use-parametric-models-in-reinforcement-learning.html index c2b3d59b..d69dfb94 100644 --- a/When-to-use-parametric-models-in-reinforcement-learning.html +++ b/When-to-use-parametric-models-in-reinforcement-learning.html @@ -159,7 +159,7 @@ @@ -297,9 +297,9 @@

    Related Posts

  • - - Hints for Computer System Design - 07 Jan 2022 + + Toolformer - Language Models Can Teach Themselves to Use Tools + 10 Feb 2023

  • diff --git a/Word-Representations-via-Gaussian-Embedding.html b/Word-Representations-via-Gaussian-Embedding.html index 76b13ae8..b46053f9 100644 --- a/Word-Representations-via-Gaussian-Embedding.html +++ b/Word-Representations-via-Gaussian-Embedding.html @@ -159,7 +159,7 @@ @@ -253,9 +253,9 @@

    Related Posts

  • - - Hints for Computer System Design - 07 Jan 2022 + + Toolformer - Language Models Can Teach Themselves to Use Tools + 10 Feb 2023

  • diff --git a/Your-Classifier-is-Secretly-an-Energy-Based-Model,-and-You-Should-Treat-it-Like-One.html b/Your-Classifier-is-Secretly-an-Energy-Based-Model,-and-You-Should-Treat-it-Like-One.html index dece2f3a..a64297b7 100644 --- a/Your-Classifier-is-Secretly-an-Energy-Based-Model,-and-You-Should-Treat-it-Like-One.html +++ b/Your-Classifier-is-Secretly-an-Energy-Based-Model,-and-You-Should-Treat-it-Like-One.html @@ -159,7 +159,7 @@ @@ -303,9 +303,9 @@

    Related Posts

  • - - Hints for Computer System Design - 07 Jan 2022 + + Toolformer - Language Models Can Teach Themselves to Use Tools + 10 Feb 2023

  • diff --git a/Zero-shot-Learning-by-Generating-Task-specific-Adapters.html b/Zero-shot-Learning-by-Generating-Task-specific-Adapters.html index a690ce20..cae6fd51 100644 --- a/Zero-shot-Learning-by-Generating-Task-specific-Adapters.html +++ b/Zero-shot-Learning-by-Generating-Task-specific-Adapters.html @@ -159,7 +159,7 @@ @@ -308,9 +308,9 @@

    Related Posts

  • - - Hints for Computer System Design - 07 Jan 2022 + + Toolformer - Language Models Can Teach Themselves to Use Tools + 10 Feb 2023

  • diff --git a/archieve.html b/archieve.html index e2870e8f..8ac7d4f9 100644 --- a/archieve.html +++ b/archieve.html @@ -159,7 +159,7 @@ @@ -184,7 +184,7 @@

    Blog Posts