learnables
diff --git a/‎.gitignore
+1 b/‎.gitignore
+1
diff --git a/‎.travis.yml
+51 b/‎.travis.yml
+51
diff --git a/‎README.md
+27-6 b/‎README.md
+27-6
diff --git a/‎docs/pydocmd.yml
+39-4 b/‎docs/pydocmd.yml
+39-4
diff --git a/‎docs/source/assets/img/halfcheetah.gif
4.09 MB b/‎docs/source/assets/img/halfcheetah.gif
4.09 MB
diff --git a/‎docs/source/tutorials/getting_started.md
+3 b/‎docs/source/tutorials/getting_started.md
+3
diff --git a/‎examples/maml_toy.py
+1-1 b/‎examples/maml_toy.py
+1-1
diff --git a/‎examples/rl/dist_promp.py
+1-1 b/‎examples/rl/dist_promp.py
+1-1
diff --git a/‎examples/rl/maml_dice.py
+1-1 b/‎examples/rl/maml_dice.py
+1-1
diff --git a/‎examples/rl/metasgd_a2c.py
+1-1 b/‎examples/rl/metasgd_a2c.py
+1-1
diff --git a/‎examples/rl/promp.py
+6-4 b/‎examples/rl/promp.py
+6-4
diff --git a/‎examples/vision/maml_miniimagenet.py
+5-5 b/‎examples/vision/maml_miniimagenet.py
+5-5
diff --git a/‎examples/vision/maml_omniglot.py
+5-5 b/‎examples/vision/maml_omniglot.py
+5-5
diff --git a/‎examples/vision/meta_mnist.py
+1-1 b/‎examples/vision/meta_mnist.py
+1-1
diff --git a/‎examples/vision/proto_net.py
+1-1 b/‎examples/vision/proto_net.py
+1-1
diff --git a/‎learn2learn/__init__.py
-2 b/‎learn2learn/__init__.py
-2
diff --git a/‎learn2learn/algorithms/__init__.py
+2-3 b/‎learn2learn/algorithms/__init__.py
+2-3
diff --git a/‎learn2learn/algorithms/dice.py
-9 b/‎learn2learn/algorithms/dice.py
-9
@@ -106,3 +106,4 @@ venv.bak/
 # mypy
 .mypy_cache/
 data/*
+docs/mkdocs.yml
@@ -0,0 +1,51 @@
+language: python
+
+os:
+    - linux
+
+python:
+    - 3.6
+    # - 3.7
+    - "3.6-dev"
+    - "3.7-dev"
+
+# matrix:
+#     include:
+#         - os: osx
+#           language: generic
+#           env: PYTHON=3.5.0
+#         - os: osx
+#           language: generic
+#           env: PYTHON=3.6.0
+#         - os: osx
+#           language: generic
+#           env: PYTHON=3.7.0
+
+before_install: |
+   if [ "$TRAVIS_OS_NAME" == "osx" ]; then
+     brew update
+     # Per the `pyenv homebrew recommendations <https://github.com/yyuu/pyenv/wiki#suggested-build-environment>`_.
+     brew install openssl readline
+     # See https://docs.travis-ci.com/user/osx-ci-environment/#A-note-on-upgrading-packages.
+     # I didn't do this above because it works and I'm lazy.
+     brew outdated pyenv || brew upgrade pyenv
+     # virtualenv doesn't work without pyenv knowledge. venv in Python 3.3
+     # doesn't provide Pip by default. So, use `pyenv-virtualenv <https://github.com/yyuu/pyenv-virtualenv/blob/master/README.md>`_.
+     brew install pyenv-virtualenv
+     pyenv install $PYTHON
+     # I would expect something like ``pyenv init; pyenv local $PYTHON`` or
+     # ``pyenv shell $PYTHON`` would work, but ``pyenv init`` doesn't seem to
+     # modify the Bash environment. ??? So, I hand-set the variables instead.
+     export PYENV_VERSION=$PYTHON
+     export PATH="/Users/travis/.pyenv/shims:${PATH}"
+     pyenv-virtualenv venv
+     source venv/bin/activate
+     # A manual check that the correct version of Python is running.
+     python --version
+   fi
+
+install: 
+    - pip install -U pip && pip install --progress-bar off -r requirements.txt && pip install pycodestyle
+
+script: 
+    - make tests
@@ -1,9 +1,30 @@
-<p align="center"><img src="https://raw.githubusercontent.com/seba-1511/learn2learn/gh-pages/assets/img/l2l-full.png" height="150px" /></p>
+<p align="center"><img src="https://raw.githubusercontent.com/seba-1511/learn2learn/gh-pages/assets/img/l2l-full.png" height="120px" /></p>
 
 --------------------------------------------------------------------------------
 
+[![Build Status](https://travis-ci.com/learnables/learn2learn.svg?branch=master)](https://travis-ci.com/learnables/learn2learn)
+
 learn2learn is a PyTorch library for meta-learning implementations.
-It was developed during the [first PyTorch Hackathon](http://pytorchmpk.devpost.com/).
+
+The goal of meta-learning is to enable agents to *learn how to learn*.
+That is, we would like our agents to become better learners as they solve more and more tasks.
+For example, the animation below shows an agent that learns to run after only one parameter update.
+
+<p align="center"><img src="assets/img/halfcheetah.gif" height="250px" /></p>
+
+**Features**
+
+learn2learn provides high- and low-level utilities for meta-learning.
+The high-level utilities allow arbitrary users to take advantage of existing meta-learning algorithms.
+The low-level utilities enable researchers to develop new and better meta-learning algorithms.
+
+Some features of learn2learn include:
+
+* Modular API: implement your own training loops with our low-level utilities.
+* Provides various meta-learning algorithms (e.g. MAML, FOMAML, MetaSGD, ProtoNets, DiCE).
+* Task generator with unified API, compatible with torchvision, torchtext, torchaudio, and cherry.
+* Provides standardized meta-learning tasks for vision (Omniglot, mini-ImageNet), reinforcement learning (Particles, Mujoco), and even text (news classification).
+* 100% compatible with PyTorch -- use your own modules, datasets, or libraries!
 
 # Installation
 
@@ -14,7 +35,7 @@ pip install learn2learn
 # API Demo
 
 The following is an example of using the high-level MAML implementation on MNIST.
-For more algorithms and lower-level utilities, please refer to [the documentation](http://learn2learn.net/docs/learn2learn/) or the [examples](https://github.com/learnables/learn2learn/tree/master/examples).
+For more algorithms and lower-level utilities, please refer to the [documentation](http://learn2learn.net/docs/learn2learn/) or the [examples](https://github.com/learnables/learn2learn/tree/master/examples).
 
 ~~~python
 import learn2learn as l2l
@@ -27,7 +48,7 @@ task_generator = l2l.data.TaskGenerator(mnist,
                                         classes=[0, 1, 4, 6, 8, 9],
                                         tasks=10)
 model = Net()
-maml = l2l.MAML(model, lr=1e-3, first_order=False)
+maml = l2l.algorithms.MAML(model, lr=1e-3, first_order=False)
 opt = optim.Adam(maml.parameters(), lr=4e-3)
 
 for iteration in range(num_iterations):
@@ -41,7 +62,7 @@ for iteration in range(num_iterations):
 
     # Compute evaluation loss
     evaluation_task = task_generator.sample(shots=1,
-                                            classes=adaptation_task.sampled_classes)
+                                            task=adaptation_task.sampled_task)
     evaluation_error = compute_loss(evaluation_task)
 
     # Meta-update the model parameters
@@ -50,6 +71,6 @@ for iteration in range(num_iterations):
     opt.step()
 ~~~
 
-# Acknowledgements
+### Acknowledgements
 
 1. The RL environments are adapted from Tristan Deleu's [implementations](https://github.com/tristandeleu/pytorch-maml-rl) and from the ProMP [repository](https://github.com/jonasrothfuss/ProMP/). Both shared with permission, under the MIT License.
@@ -6,7 +6,37 @@ site_name: "learn2learn"
 # documented. Higher indentation leads to smaller header size.
 generate:
   - docs/learn2learn.md:
-      - learn2learn+
+      - learn2learn.clone_module
+      - learn2learn.detach_module
+      - learn2learn.magic_box
+  - docs/learn2learn.data.md:
+      - learn2learn.data.MetaDataset
+      - learn2learn.data.TaskGenerator++
+  - docs/learn2learn.algorithms.md:
+      - learn2learn.algorithms.MAML++
+      - learn2learn.algorithms.maml_update
+      - learn2learn.algorithms.MetaSGD++
+      - learn2learn.algorithms.meta_sgd_update
+  - docs/learn2learn.gym.md:
+      - learn2learn.gym++
+      - learn2learn.gym.envs.mujoco
+      - learn2learn.gym.envs.mujoco.HalfCheetahForwardBackwardEnv
+      - learn2learn.gym.envs.mujoco.AntForwardBackwardEnv
+      - learn2learn.gym.envs.mujoco.AntDirectionEnv
+      - learn2learn.gym.envs.mujoco.HumanoidForwardBackwardEnv
+      - learn2learn.gym.envs.mujoco.HumanoidDirectionEnv
+      - learn2learn.gym.envs.particles
+      - learn2learn.gym.envs.particles.Particles2DEnv
+  - docs/learn2learn.vision.md:
+      - learn2learn.vision.models
+      - learn2learn.vision.models.OmniglotFC
+      - learn2learn.vision.models.OmniglotCNN
+      - learn2learn.vision.datasets
+      - learn2learn.vision.datasets.FullOmniglot
+      - learn2learn.vision.transforms
+      - learn2learn.vision.transforms.RandomDiscreteRotation
+  - docs/learn2learn.text.md:
+      - learn2learn.text.datasets.NewsClassification
 
 # MkDocs pages configuration. The `<<` operator is sugar added by pydocmd
 # that allows you to use an external Markdown file (eg. your project's README)
@@ -18,8 +48,13 @@ pages:
       - Getting Started: tutorials/getting_started.md
   - Documentation:
       - learn2learn: docs/learn2learn.md
-  - Examples: https://github.com/seba-1511/learn2learn/tree/master/examples
-  - GitHub: https://github.com/seba-1511/learn2learn/
+      - learn2learn.algorithms: docs/learn2learn.algorithms.md
+      - learn2learn.data: docs/learn2learn.data.md
+      - learn2learn.gym: docs/learn2learn.gym.md
+      - learn2learn.text: docs/learn2learn.text.md
+      - learn2learn.vision: docs/learn2learn.vision.md
+  - Examples: https://github.com/learnables/learn2learn/tree/master/examples
+  - GitHub: https://github.com/learnables/learn2learn/
 
 # These options all show off their default values. You don't have to add
 # them to your configuration if you're fine with the default.
@@ -34,7 +69,7 @@ theme:
   custom_dir: 'l2l_theme/'
   highlightjs: true
 loader: pydocmd.loader.PythonLoader
-preprocessor: pydocmd.preprocessors.simple.Preprocessor
+preprocessor: pydocmd.preprocessor.Preprocessor
 # Whether to output headers as markdown or HTML.  Used to workaround
 # https://github.com/NiklasRosenstein/pydoc-markdown/issues/11.  The default is
 # to generate HTML with unique and meaningful id tags, which can't be done with
 
@@ -30,7 +30,9 @@ For more information about specific meta-learning algorithms, please refer to th
 appropriate tutorial.
 
 # How to Use L2L
+
 ## Installing
+
 A pip package is available, updated periodically. Use the command:
 
 ```pip install learn2learn```
@@ -48,6 +50,7 @@ encounter a problem, feel free to an open an [issue](https://github.com/learnabl
 look into it.
 
 ## Source Files
+
 Examples of learn2learn in action can be found [here](https://github.com/learnables/learn2learn/tree/master/examples).
 The source code for algorithm implementations is also available [here](https://github.com/learnables/learn2learn/tree/master/learn2learn/algorithms).
 
@@ -31,7 +31,7 @@ def forward(self, x=None):
 def main():
     task_dist = dist.Normal(th.zeros(2 * DIM), th.ones(2 * DIM))
     model = Model()
-    maml = l2l.MAML(model, lr=1e-2)
+    maml = l2l.algorithms.MAML(model, lr=1e-2)
     opt = optim.Adam(maml.parameters())
 
     for i in range(TIMESTEPS):
 
@@ -124,7 +124,7 @@ def make_env():
     policy = DiagNormalPolicy(input_size=env.state_size,
                               output_size=env.action_size,
                               hiddens=[64, 64])
-    meta_learner = l2l.MAML(policy, lr=meta_lr)
+    meta_learner = l2l.algorithms.MAML(policy, lr=meta_lr)
     baseline = LinearValue(env.state_size, env.action_size)
     opt = optim.Adam(meta_learner.parameters(), lr=meta_lr)
 
 
@@ -89,7 +89,7 @@ def make_env():
     env.seed(seed)
     env = ch.envs.Torch(env)
     policy = DiagNormalPolicy(env.state_size, env.action_size)
-    meta_learner = l2l.MAML(policy, lr=meta_lr)
+    meta_learner = l2l.algorithms.MAML(policy, lr=meta_lr)
     baseline = LinearValue(env.state_size, env.action_size)
     opt = optim.Adam(policy.parameters(), lr=meta_lr)
     all_rewards = []
 
@@ -79,7 +79,7 @@ def make_env():
     env.seed(seed)
     env = ch.envs.Torch(env)
     policy = DiagNormalPolicy(env.state_size, env.action_size)
-    meta_learner = l2l.MetaSGD(policy, lr=meta_lr)
+    meta_learner = l2l.algorithms.MetaSGD(policy, lr=meta_lr)
     baseline = LinearValue(env.state_size, env.action_size)
     opt = optim.Adam(policy.parameters(), lr=meta_lr)
     all_rewards = []
 
@@ -72,10 +72,10 @@ def precompute_quantities(states, actions, old_policy, new_policy):
 
 
 def main(
-        env_name='Particles2D-v1',
+        env_name='AntDirection-v1',
         adapt_lr=0.1,
         meta_lr=3e-4,
-        adapt_steps=1,
+        adapt_steps=3,
         num_iterations=1000,
         meta_bsz=40,
         adapt_bsz=20,
@@ -94,7 +94,9 @@ def main(
     th.manual_seed(seed)
 
     def make_env():
-        return gym.make(env_name)
+        env = gym.make(env_name)
+        env = ch.envs.ActionSpaceScaler(env)
+        return env
 
     env = l2l.gym.AsyncVectorEnv([make_env for _ in range(num_workers)])
     env.seed(seed)
@@ -104,7 +106,7 @@ def make_env():
                               output_size=env.action_size,
                               hiddens=[64, 64],
                               activation='tanh')
-    meta_learner = l2l.MAML(policy, lr=meta_lr)
+    meta_learner = l2l.algorithms.MAML(policy, lr=meta_lr)
     baseline = LinearValue(env.state_size, env.action_size)
     opt = optim.Adam(meta_learner.parameters(), lr=meta_lr)
 
 
@@ -76,9 +76,9 @@ def main(
     test_generator = l2l.data.TaskGenerator(dataset=test_dataset, ways=ways)
 
     # Create model
-    model = l2l.models.MiniImagenetCNN(ways)
+    model = l2l.vision.models.MiniImagenetCNN(ways)
     model.to(device)
-    maml = l2l.MAML(model, lr=fast_lr, first_order=False)
+    maml = l2l.algorithms.MAML(model, lr=fast_lr, first_order=False)
     opt = optim.Adam(maml.parameters(), meta_lr)
     loss = nn.CrossEntropyLoss(size_average=True, reduction='mean')
 
@@ -95,7 +95,7 @@ def main(
             learner = maml.clone()
             adaptation_data = train_generator.sample(shots=shots)
             evaluation_data = train_generator.sample(shots=shots,
-                                                     classes=adaptation_data.sampled_classes)
+                                                     task=adaptation_data.sampled_task)
             evaluation_error, evaluation_accuracy = fast_adapt(adaptation_data,
                                                                evaluation_data,
                                                                learner,
@@ -110,7 +110,7 @@ def main(
             learner = maml.clone()
             adaptation_data = valid_generator.sample(shots=shots)
             evaluation_data = valid_generator.sample(shots=shots,
-                                                     classes=adaptation_data.sampled_classes)
+                                                     task=adaptation_data.sampled_task)
             evaluation_error, evaluation_accuracy = fast_adapt(adaptation_data,
                                                                evaluation_data,
                                                                learner,
@@ -124,7 +124,7 @@ def main(
             learner = maml.clone()
             adaptation_data = test_generator.sample(shots=shots)
             evaluation_data = test_generator.sample(shots=shots,
-                                                    classes=adaptation_data.sampled_classes)
+                                                    task=adaptation_data.sampled_task)
             evaluation_error, evaluation_accuracy = fast_adapt(adaptation_data,
                                                                evaluation_data,
                                                                learner,
 
@@ -71,9 +71,9 @@ def main(
     test_generator = l2l.data.TaskGenerator(dataset=omniglot, ways=ways, classes=classes[1200:])
 
     # Create model
-    model = l2l.models.OmniglotFC(28 ** 2, ways)
+    model = l2l.vision.models.OmniglotFC(28 ** 2, ways)
     model.to(device)
-    maml = l2l.MAML(model, lr=fast_lr, first_order=False)
+    maml = l2l.algorithms.MAML(model, lr=fast_lr, first_order=False)
     opt = optim.Adam(maml.parameters(), meta_lr)
     loss = nn.CrossEntropyLoss(size_average=True, reduction='mean')
 
@@ -90,7 +90,7 @@ def main(
             learner = maml.clone()
             adaptation_data = train_generator.sample(shots=shots)
             evaluation_data = train_generator.sample(shots=shots,
-                                                     classes=adaptation_data.sampled_classes)
+                                                     task=adaptation_data.sampled_task)
             evaluation_error, evaluation_accuracy = fast_adapt(adaptation_data,
                                                                evaluation_data,
                                                                learner,
@@ -105,7 +105,7 @@ def main(
             learner = maml.clone()
             adaptation_data = valid_generator.sample(shots=shots)
             evaluation_data = valid_generator.sample(shots=shots,
-                                                     classes=adaptation_data.sampled_classes)
+                                                     task=adaptation_data.sampled_task)
             evaluation_error, evaluation_accuracy = fast_adapt(adaptation_data,
                                                                evaluation_data,
                                                                learner,
@@ -119,7 +119,7 @@ def main(
             learner = maml.clone()
             adaptation_data = test_generator.sample(shots=shots)
             evaluation_data = test_generator.sample(shots=shots,
-                                                    classes=adaptation_data.sampled_classes)
+                                                    task=adaptation_data.sampled_task)
             evaluation_error, evaluation_accuracy = fast_adapt(adaptation_data,
                                                                evaluation_data,
                                                                learner,
 
@@ -71,7 +71,7 @@ def main(lr=0.005, maml_lr=0.01, iterations=1000, ways=5, shots=1, tps=32, fas=5
 
     model = Net(ways)
     model.to(device)
-    meta_model = l2l.MAML(model, lr=maml_lr)
+    meta_model = l2l.algorithms.MAML(model, lr=maml_lr)
     opt = optim.Adam(meta_model.parameters(), lr=lr)
     loss_func = nn.NLLLoss(reduction="sum")
 
 
@@ -17,7 +17,7 @@
 from torchvision import transforms
 
 import learn2learn as l2l
-from learn2learn.models import OmniglotCNN
+from learn2learn.vision.models import OmniglotCNN
 from learn2learn.vision.datasets.full_omniglot import FullOmniglot
 
 
 
@@ -3,9 +3,7 @@
 from . import algorithms
 from . import data
 from . import gym
-from . import models
 from . import text
 from . import vision
 from ._version import __version__
-from .algorithms import MAML, MetaSGD, magic_box
 from .utils import *
@@ -1,5 +1,4 @@
 #!/usr/bin/env python3
 
-from .dice import magic_box
-from .maml import MAML
-from .meta_sgd import MetaSGD
+from .maml import MAML, maml_update
+from .meta_sgd import MetaSGD, meta_sgd_update