intel
diff --git a/‎CHANGELOG.md‎
Lines changed: 1 addition & 0 deletions b/‎CHANGELOG.md‎
Lines changed: 1 addition & 0 deletions
diff --git a/‎dffml/__init__.py‎
Lines changed: 11 additions & 3 deletions b/‎dffml/__init__.py‎
Lines changed: 11 additions & 3 deletions
diff --git a/‎dffml/cli/ml.py‎
Lines changed: 7 additions & 16 deletions b/‎dffml/cli/ml.py‎
Lines changed: 7 additions & 16 deletions
diff --git a/‎dffml/high_level.py‎
Lines changed: 143 additions & 0 deletions b/‎dffml/high_level.py‎
Lines changed: 143 additions & 0 deletions
diff --git a/‎dffml/model/__init__.py‎
Lines changed: 1 addition & 1 deletion b/‎dffml/model/__init__.py‎
Lines changed: 1 addition & 1 deletion
diff --git a/‎dffml/accuracy.py‎ ‎dffml/model/accuracy.py‎dffml/accuracy.py renamed to dffml/model/accuracy.py b/‎dffml/accuracy.py‎ ‎dffml/model/accuracy.py‎dffml/accuracy.py renamed to dffml/model/accuracy.py
diff --git a/‎dffml/model/model.py‎
Lines changed: 1 addition & 1 deletion b/‎dffml/model/model.py‎
Lines changed: 1 addition & 1 deletion
diff --git a/‎dffml/noasync.py‎
Lines changed: 31 additions & 0 deletions b/‎dffml/noasync.py‎
Lines changed: 31 additions & 0 deletions
diff --git a/‎dffml/skel/model/REPLACE_IMPORT_PACKAGE_NAME/misc.py‎
Lines changed: 1 addition & 1 deletion b/‎dffml/skel/model/REPLACE_IMPORT_PACKAGE_NAME/misc.py‎
Lines changed: 1 addition & 1 deletion
diff --git a/‎dffml/source/file.py‎
Lines changed: 1 addition & 3 deletions b/‎dffml/source/file.py‎
Lines changed: 1 addition & 3 deletions
@@ -57,6 +57,7 @@ and this project adheres to [Semantic Versioning](https://semver.org/spec/v2.0.0
 - Subclasses of `BaseConfigurable` will now auto instantiate their respective
   config classes using `kwargs` if the config argument isn't given and keyword
   arguments are.
+- The quickstart documentation and the overall structure of the docs were improved.
 ### Fixed
 - CONTRIBUTING.md has `-e` in the wrong place in the getting setup section.
 - Since moving to auto `args()` and `config()`, BaseConfigurable no longer
 
@@ -1,6 +1,14 @@
-# SPDX-License-Identifier: MIT
-# Copyright (c) 2019 Intel Corporation
-from .feature import Feature
+# General
+from .high_level import train, accuracy, predict
+from .feature import Features, Feature, DefFeature
+
+# Sources
+from .source.source import Sources, BaseSource, BaseSourceContext
+from .source.csv import CSVSource
+from .source.json import JSONSource
+
+# Models
+from .model import Model, ModelContext
 
 # Used to declare our namespace for resource discovery
 __import__("pkg_resources").declare_namespace(__name__)
@@ -1,6 +1,7 @@
 from ..source.source import SubsetSources
 from ..util.cli.arg import Arg
 from ..util.cli.cmd import CMD
+from ..high_level import train, predict, accuracy
 from ..util.cli.cmds import SourcesCMD, ModelCMD, KeysCMD
 
 
@@ -22,18 +23,14 @@ class Train(MLCMD):
     """
 
     async def run(self):
-        async with self.sources as sources, self.model as model:
-            async with sources() as sctx, model() as mctx:
-                return await mctx.train(sctx)
+        return await train(self.model, self.sources)
 
 
 class Accuracy(MLCMD):
     """Assess model accuracy on data from given sources"""
 
     async def run(self):
-        async with self.sources as sources, self.model as model:
-            async with sources() as sctx, model() as mctx:
-                return float(await mctx.accuracy(sctx))
+        return await accuracy(self.model, self.sources)
 
 
 class PredictAll(MLCMD):
@@ -47,17 +44,11 @@ class PredictAll(MLCMD):
         action="store_true",
     )
 
-    async def predict(self, mctx, sctx, repos):
-        async for repo in mctx.predict(repos):
-            yield repo
-            if self.update:
-                await sctx.update(repo)
-
     async def run(self):
-        async with self.sources as sources, self.model as model:
-            async with sources() as sctx, model() as mctx:
-                async for repo in self.predict(mctx, sctx, sctx.repos()):
-                    yield repo
+        async for repo in predict(
+            self.model, self.sources, update=self.update, keep_repo=True
+        ):
+            yield repo
 
 
 class PredictRepo(PredictAll, KeysCMD):
 
@@ -0,0 +1,143 @@
+"""
+High level abstraction interfaces to DFFML. These are intended for use in
+short Python scripts which just want to train, assess, or predict.
+"""
+import pathlib
+from typing import Union, Dict, Any
+
+from .repo import Repo
+from .source.source import Sources, BaseSource
+from .source.memory import MemorySource, MemorySourceConfig
+
+
+def _repos_to_sources(*args):
+    """
+    Build a ``Sources`` collection from a mixed list of inputs.
+
+    Each argument is handled according to its type:
+
+    - ``Sources`` (first argument only): used as the collection everything
+      else is appended to. It is modified in place.
+    - ``BaseSource``: added to the collection as is.
+    - ``dict``: wrapped in a ``Repo`` constructed from the argument's
+      position and the dict as its ``features`` data.
+    - ``Repo``: collected, together with any converted dicts, into a single
+      ``MemorySource`` which is appended last.
+    - ``str`` containing a ``.``: treated as a filename. The source to load
+      is selected by the file extension.
+
+    Arguments of any other type are ignored.
+    """
+    # If the first arg is an instance of Sources, append the rest to that.
+    if args and isinstance(args[0], Sources):
+        sources = args[0]
+        # Sources passed after the first argument must not be dropped
+        for arg in args[1:]:
+            if isinstance(arg, BaseSource):
+                sources.append(arg)
+    else:
+        sources = Sources(
+            *[arg for arg in args if isinstance(arg, BaseSource)]
+        )
+    # Repos to add to memory source
+    repos = []
+    for i, arg in enumerate(args):
+        # Convert dicts to repos
+        if isinstance(arg, dict):
+            arg = Repo(i, data={"features": arg})
+        if isinstance(arg, Repo):
+            repos.append(arg)
+        elif isinstance(arg, str) and "." in arg:
+            # The file extension, without the dot, names the source to load
+            extension = pathlib.Path(arg).suffix.replace(".", "")
+            source = BaseSource.load(extension)
+            sources.append(source(filename=arg))
+    # Create memory source if there are any repos
+    if repos:
+        sources.append(MemorySource(MemorySourceConfig(repos=repos)))
+    return sources
+
+
+async def train(
+    model, *args: Union[Sources, BaseSource, Repo, Dict[str, Any], str]
+):
+    """
+    Train a machine learning model.
+
+    Provide records to the model to train it. The model should be already
+    instantiated.
+
+    Parameters
+    ----------
+    model : Model
+        Machine Learning model to use. See :doc:`/plugins/dffml_model` for
+        model options.
+    *args : list
+        Input data for training. Could be a ``dict``, :py:class:`Repo`, one of
+        the data :doc:`/plugins/dffml_source`, or a filename with the
+        extension being one of the data sources.
+
+    Returns
+    -------
+    Whatever the ``train`` method of the model's context returns.
+    """
+    sources = _repos_to_sources(*args)
+    # Enter the sources and the model, then their respective contexts
+    async with sources as sources, model as model:
+        async with sources() as sctx, model() as mctx:
+            return await mctx.train(sctx)
+
+
+async def accuracy(
+    model, *args: Union[Sources, BaseSource, Repo, Dict[str, Any], str]
+) -> float:
+    """
+    Assess the accuracy of a machine learning model.
+
+    Provide records to the model to assess the percent accuracy of its
+    prediction abilities. The model should be already instantiated and trained.
+
+    Parameters
+    ----------
+    model : Model
+        Machine Learning model to use. See :doc:`/plugins/dffml_model` for
+        model options.
+    *args : list
+        Input data to assess accuracy with. Could be a ``dict``,
+        :py:class:`Repo`, one of the data :doc:`/plugins/dffml_source`, or a
+        filename with the extension being one of the data sources.
+
+    Returns
+    -------
+    float
+        A decimal value representing the percent of the time the model made the
+        correct prediction. For some models this has another meaning. Please see
+        the documentation for the model you're using for further details.
+    """
+    sources = _repos_to_sources(*args)
+    # Enter the sources and the model, then their respective contexts
+    async with sources as sources, model as model:
+        async with sources() as sctx, model() as mctx:
+            # The model context's result is converted to a plain float
+            return float(await mctx.accuracy(sctx))
+
+
+async def predict(
+    model,
+    *args: Union[Sources, BaseSource, Repo, Dict[str, Any], str],
+    update: bool = False,
+    keep_repo: bool = False,
+):
+    """
+    Make a prediction using a machine learning model.
+
+    The model must be trained before using it to make a prediction.
+
+    Parameters
+    ----------
+    model : Model
+        Machine Learning model to use. See :doc:`/plugins/dffml_model` for
+        model options.
+    *args : list
+        Input data for prediction. Could be a ``dict``, :py:class:`Repo`,
+        filename, or one of the data :doc:`/plugins/dffml_source`.
+    update : boolean, optional
+        If ``True`` prediction data within records will be written back to all
+        sources given. Each record is written back before it is yielded.
+        Defaults to ``False``.
+    keep_repo : boolean, optional
+        If ``True`` the results will be kept as their ``Repo`` objects instead
+        of being converted to a ``(repo.key, features, predictions)`` tuple.
+        Defaults to ``False``.
+
+    Returns
+    -------
+    asynciterator
+        ``Repo`` objects or ``(repo.key, features, predictions)`` tuple.
+    """
+    sources = _repos_to_sources(*args)
+    async with sources as sources, model as model:
+        async with sources() as sctx, model() as mctx:
+            async for repo in mctx.predict(sctx.repos()):
+                # Write back before yielding. A consumer which stops iterating
+                # after receiving a repo would otherwise never trigger the
+                # update for that repo.
+                if update:
+                    await sctx.update(repo)
+                yield repo if keep_repo else (
+                    repo.key,
+                    repo.features(),
+                    repo.predictions(),
+                )
@@ -15,7 +15,7 @@
 >>>     },
 >>> )
 """
-from .model import Model
+from .model import Model, ModelContext
 
 # Declares dffml.model as a namespace package
 __import__("pkg_resources").declare_namespace(__name__)
@@ -17,7 +17,7 @@
 from ..repo import Repo
 from ..source.source import Sources
 from ..feature import Features
-from ..accuracy import Accuracy
+from .accuracy import Accuracy
 from ..util.entrypoint import base_entry_point
 
 
 
@@ -0,0 +1,31 @@
+import asyncio
+
+from . import high_level
+
+
+def train(*args, **kwargs):
+    """
+    Blocking version of ``high_level.train``.
+
+    All arguments are forwarded unchanged. The coroutine is run to completion
+    with ``asyncio.run`` and its result is returned.
+    """
+    coroutine = high_level.train(*args, **kwargs)
+    return asyncio.run(coroutine)
+
+
+def accuracy(*args, **kwargs):
+    """
+    Blocking version of ``high_level.accuracy``.
+
+    All arguments are forwarded unchanged. The coroutine is run to completion
+    with ``asyncio.run`` and its result is returned.
+    """
+    coroutine = high_level.accuracy(*args, **kwargs)
+    return asyncio.run(coroutine)
+
+
+def predict(*args, **kwargs):
+    """
+    Blocking version of ``high_level.predict``.
+
+    All arguments are forwarded unchanged. This is a regular generator which
+    drives the asynchronous generator on a private event loop, yielding each
+    result as it is produced.
+
+    The asynchronous generator and the event loop are closed when iteration
+    finishes, when an exception is raised, or when this generator is closed
+    before being exhausted.
+    """
+    async_gen = high_level.predict(*args, **kwargs).__aiter__()
+
+    loop = asyncio.new_event_loop()
+
+    try:
+        while True:
+            try:
+                result = loop.run_until_complete(async_gen.__anext__())
+            except StopAsyncIteration:
+                return
+            yield result
+    finally:
+        try:
+            # Close the generator explicitly so that the ``async with`` blocks
+            # it is suspended in are exited, rather than relying only on
+            # shutdown_asyncgens() to find it.
+            loop.run_until_complete(async_gen.aclose())
+            loop.run_until_complete(loop.shutdown_asyncgens())
+        finally:
+            loop.close()
@@ -8,7 +8,7 @@
 from dffml.repo import Repo
 from dffml.source.source import Sources
 from dffml.feature import Features
-from dffml.accuracy import Accuracy
+from dffml.model.accuracy import Accuracy
 from dffml.model.model import ModelContext, Model
 from dffml.util.entrypoint import entrypoint
 from dffml.base import config
 
@@ -112,9 +112,7 @@ def zip_opener_helper(self):
     @contextmanager
     def zip_closer_helper(self):
         with zipfile.ZipFile(
-            self.config.filename,
-            self.WRITEMODE,
-            compression=zipfile.ZIP_BZIP2,
+            self.config.filename, self.WRITEMODE, compression=zipfile.ZIP_BZIP2
         ) as archive:
             with archive.open(
                 self.__class__.__qualname__,