1
0
mirror of https://github.com/gsi-upm/senpy synced 2025-01-09 21:11:27 +00:00

Compare commits

..

No commits in common. "45421f4613f0c7a450bd1c42b5e78a417277aa78" and "8a516d927e1621eb3e6c11e36a6f45395d65e80e" have entirely different histories.

19 changed files with 7245 additions and 6604 deletions

View File

@ -21,16 +21,16 @@ before_script:
except: except:
- tags # Avoid unnecessary double testing - tags # Avoid unnecessary double testing
test-3.6: test-3.5:
<<: *test_definition <<: *test_definition
variables: variables:
PYTHON_VERSION: "3.6" PYTHON_VERSION: "3.5"
test-3.7: test-2.7:
<<: *test_definition <<: *test_definition
allow_failure: true allow_failure: true
variables: variables:
PYTHON_VERSION: "3.7" PYTHON_VERSION: "2.7"
push: push:
stage: push stage: push
@ -101,3 +101,4 @@ cleanup_py:
when: always # this is important; run even if preceding stages failed. when: always # this is important; run even if preceding stages failed.
script: script:
- rm -vf ~/.pypirc # we don't want to leave these around, but GitLab may clean up anyway. - rm -vf ~/.pypirc # we don't want to leave these around, but GitLab may clean up anyway.
- docker logout

View File

@ -6,10 +6,7 @@ services:
language: python language: python
env: env:
- PYV=3.4 - PYV=2.7
- PYV=3.5 - PYV=3.5
- PYV=3.6
- PYV=3.7
# - PYV=3.3 # Apt fails in this docker image
# run nosetests - Tests # run nosetests - Tests
script: make test-$PYV script: make test-$PYV

View File

@ -6,11 +6,6 @@ and this project adheres to [Semantic Versioning](https://semver.org/spec/v2.0.0
## [Unreleased] ## [Unreleased]
### Fixed
* Restored hash changing function in `main.js`
## 0.20
### Added ### Added
* Objects can control the keys that will be used in `serialize`/`jsonld`/`as_dict` by specifying a list of keys in `terse_keys`. * Objects can control the keys that will be used in `serialize`/`jsonld`/`as_dict` by specifying a list of keys in `terse_keys`.
e.g. e.g.
@ -32,7 +27,6 @@ e.g.
* Plugin and parameter descriptions are now formatted with [showdown](https://github.com/showdownjs/showdown). * Plugin and parameter descriptions are now formatted with [showdown](https://github.com/showdownjs/showdown).
* The web UI requests extra_parameters from the server. This is useful for pipelines. See #52 * The web UI requests extra_parameters from the server. This is useful for pipelines. See #52
* First batch of semantic tests (using SPARQL) * First batch of semantic tests (using SPARQL)
* `Plugin.path()` method to get a file path from a relative path (using the senpy data folder)
### Changed ### Changed
* `install_deps` now checks what requirements are already met before installing with pip. * `install_deps` now checks what requirements are already met before installing with pip.

File diff suppressed because it is too large Load Diff

View File

@ -1,152 +0,0 @@
{
"cells": [
{
"cell_type": "markdown",
"metadata": {},
"source": [
"# Senpy in 1 minute\n",
"\n",
"This mini-tutorial only shows how to annotate with a service.\n",
"We will use the [demo server](http://senpy.gsi.upm.es), which runs some open source plugins for sentiment and emotion analysis."
]
},
{
"cell_type": "markdown",
"metadata": {},
"source": [
"Annotating with senpy is as simple as issuing an HTTP request to the API using your favourite tool.\n",
"This is just an example using curl:"
]
},
{
"cell_type": "code",
"execution_count": 16,
"metadata": {},
"outputs": [
{
"name": "stdout",
"output_type": "stream",
"text": [
"{\r\n",
" \"@context\": \"http://senpy.gsi.upm.es/api/contexts/YXBpL3NlbnRpbWVudDE0MD8j\",\r\n",
" \"@type\": \"Results\",\r\n",
" \"entries\": [\r\n",
" {\r\n",
" \"@id\": \"prefix:\",\r\n",
" \"@type\": \"Entry\",\r\n",
" \"marl:hasOpinion\": [\r\n",
" {\r\n",
" \"@type\": \"Sentiment\",\r\n",
" \"marl:hasPolarity\": \"marl:Positive\",\r\n",
" \"prov:wasGeneratedBy\": \"prefix:Analysis_1554389334.6431913\"\r\n",
" }\r\n",
" ],\r\n",
" \"nif:isString\": \"Senpy is awesome\",\r\n",
" \"onyx:hasEmotionSet\": []\r\n",
" }\r\n",
" ]\r\n",
"}"
]
}
],
"source": [
"!curl \"http://senpy.gsi.upm.es/api/sentiment140\" --data-urlencode \"input=Senpy is awesome\""
]
},
{
"cell_type": "markdown",
"metadata": {},
"source": [
"**Congratulations**, you've used your first senpy service!"
]
},
{
"cell_type": "markdown",
"metadata": {},
"source": [
"Here is the equivalent using the `requests` library:"
]
},
{
"cell_type": "code",
"execution_count": 17,
"metadata": {
"scrolled": true
},
"outputs": [
{
"name": "stdout",
"output_type": "stream",
"text": [
"{\n",
" \"@context\": \"http://senpy.gsi.upm.es/api/contexts/YXBpL3NlbnRpbWVudDE0MD9pbnB1dD1TZW5weStpcythd2Vzb21lIw%3D%3D\",\n",
" \"@type\": \"Results\",\n",
" \"entries\": [\n",
" {\n",
" \"@id\": \"prefix:\",\n",
" \"@type\": \"Entry\",\n",
" \"marl:hasOpinion\": [\n",
" {\n",
" \"@type\": \"Sentiment\",\n",
" \"marl:hasPolarity\": \"marl:Positive\",\n",
" \"prov:wasGeneratedBy\": \"prefix:Analysis_1554389335.9803226\"\n",
" }\n",
" ],\n",
" \"nif:isString\": \"Senpy is awesome\",\n",
" \"onyx:hasEmotionSet\": []\n",
" }\n",
" ]\n",
"}\n"
]
}
],
"source": [
"import requests\n",
"res = requests.get('http://senpy.gsi.upm.es/api/sentiment140',\n",
" params={\"input\": \"Senpy is awesome\",})\n",
"print(res.text)"
]
}
],
"metadata": {
"anaconda-cloud": {},
"kernelspec": {
"display_name": "Python 3",
"language": "python",
"name": "python3"
},
"language_info": {
"codemirror_mode": {
"name": "ipython",
"version": 3
},
"file_extension": ".py",
"mimetype": "text/x-python",
"name": "python",
"nbconvert_exporter": "python",
"pygments_lexer": "ipython3",
"version": "3.7.3"
},
"toc": {
"colors": {
"hover_highlight": "#DAA520",
"running_highlight": "#FF0000",
"selected_highlight": "#FFD700"
},
"moveMenuLeft": true,
"nav_menu": {
"height": "68px",
"width": "252px"
},
"navigate_menu": true,
"number_sections": true,
"sideBar": true,
"threshold": 4,
"toc_cell": false,
"toc_section_display": "block",
"toc_window_display": false
}
},
"nbformat": 4,
"nbformat_minor": 1
}

File diff suppressed because it is too large Load Diff

File diff suppressed because it is too large Load Diff

2599
docs/Quickstart.rst Normal file

File diff suppressed because it is too large Load Diff

View File

@ -7,4 +7,3 @@ Advanced usage
server-cli server-cli
conversion conversion
commandline commandline
development

View File

@ -38,8 +38,6 @@ extensions = [
'sphinxcontrib.httpdomain', 'sphinxcontrib.httpdomain',
'sphinx.ext.coverage', 'sphinx.ext.coverage',
'sphinx.ext.autosectionlabel', 'sphinx.ext.autosectionlabel',
'nbsphinx',
'sphinx.ext.mathjax',
] ]
# Add any paths that contain templates here, relative to this directory. # Add any paths that contain templates here, relative to this directory.
@ -56,7 +54,7 @@ master_doc = 'index'
# General information about the project. # General information about the project.
project = u'Senpy' project = u'Senpy'
copyright = u'2019, J. Fernando Sánchez' copyright = u'2016, J. Fernando Sánchez'
description = u'A framework for sentiment and emotion analysis services' description = u'A framework for sentiment and emotion analysis services'
# The version info for the project you're documenting, acts as replacement for # The version info for the project you're documenting, acts as replacement for
@ -81,9 +79,7 @@ language = None
# List of patterns, relative to source directory, that match files and # List of patterns, relative to source directory, that match files and
# directories to ignore when looking for source files. # directories to ignore when looking for source files.
exclude_patterns = ['_build', '**.ipynb_checkpoints'] exclude_patterns = ['_build']
# The reST default role (used for this markup: `text`) to use for all # The reST default role (used for this markup: `text`) to use for all
# documents. # documents.
@ -290,13 +286,3 @@ texinfo_documents = [
# If true, do not generate a @detailmenu in the "Top" node's menu. # If true, do not generate a @detailmenu in the "Top" node's menu.
#texinfo_no_detailmenu = False #texinfo_no_detailmenu = False
nbsphinx_prolog = """
.. note:: This page has been auto-generated from a Jupyter notebook using nbsphinx_.
The original source is available at: https://github.com/gsi-upm/senpy/tree/master/docs//{{ env.doc2path(env.docname, base=None) }}
.. _nbsphinx: https://nbsphinx.readthedocs.io/
----
"""

View File

@ -4,10 +4,11 @@ Demo
There is a demo available on http://senpy.gsi.upm.es/, where you can test a live instance of Senpy, with several open source plugins. There is a demo available on http://senpy.gsi.upm.es/, where you can test a live instance of Senpy, with several open source plugins.
You can use the playground (a web interface) or make HTTP requests to the service API. You can use the playground (a web interface) or make HTTP requests to the service API.
.. image:: playground-0.20.png .. image:: senpy-playground.png
:target: http://senpy.gsi.upm.es :height: 400px
:width: 800px :width: 800px
:scale: 100 %
:align: center :align: center
The source code and description of the plugins used in the demo are available here: https://github.com/gsi-upm/senpy-plugins-community/. The source code and description of the plugins used in the demo are available here: https://lab.gsi.upm.es/senpy/senpy-plugins-community/.

View File

@ -1,6 +1,5 @@
Welcome to Senpy's documentation! Welcome to Senpy's documentation!
================================= =================================
.. image:: https://readthedocs.org/projects/senpy/badge/?version=latest .. image:: https://readthedocs.org/projects/senpy/badge/?version=latest
:target: http://senpy.readthedocs.io/en/latest/ :target: http://senpy.readthedocs.io/en/latest/
.. image:: https://badge.fury.io/py/senpy.svg .. image:: https://badge.fury.io/py/senpy.svg
@ -13,6 +12,7 @@ Welcome to Senpy's documentation!
:target: https://lab.gsi.upm.es/senpy/senpy/ :target: https://lab.gsi.upm.es/senpy/senpy/
Senpy is a framework for sentiment and emotion analysis services. Senpy is a framework for sentiment and emotion analysis services.
Senpy services are interchangeable and easy to use because they share a common semantic :doc:`apischema`. Senpy services are interchangeable and easy to use because they share a common semantic :doc:`apischema`.
@ -20,16 +20,15 @@ If you are interested in consuming Senpy services, read :doc:`Quickstart`.
To get familiar with the concepts behind Senpy, and what it can offer for service developers, check out :doc:`development`. To get familiar with the concepts behind Senpy, and what it can offer for service developers, check out :doc:`development`.
:doc:`apischema` contains information about the semantic models and vocabularies used by Senpy. :doc:`apischema` contains information about the semantic models and vocabularies used by Senpy.
.. toctree:: .. toctree::
:caption: Learn more about senpy: :caption: Learn more about senpy:
:maxdepth: 2 :maxdepth: 2
senpy senpy
demo Quickstart
Quickstart.ipynb
installation installation
development
apischema apischema
advanced advanced
demo
publications publications

Binary file not shown.

Before

Width:  |  Height:  |  Size: 68 KiB

View File

@ -22,7 +22,7 @@ Hence, two parts are necessary: 1) the code that will process the entry, and 2)
In practice, this is what a plugin looks like, tests included: In practice, this is what a plugin looks like, tests included:
.. literalinclude:: ../example-plugins/rand_plugin.py .. literalinclude:: ../senpy/plugins/example/rand_plugin.py
:emphasize-lines: 5-11 :emphasize-lines: 5-11
:language: python :language: python
@ -76,9 +76,8 @@ Most plugins will need access to files (dictionaries, lexicons, etc.).
These files are usually heavy or under a license that does not allow redistribution. These files are usually heavy or under a license that does not allow redistribution.
For this reason, senpy has a `data_folder` that is separated from the source files. For this reason, senpy has a `data_folder` that is separated from the source files.
The location of this folder is controlled programmatically or by setting the `SENPY_DATA` environment variable. The location of this folder is controlled programmatically or by setting the `SENPY_DATA` environment variable.
You can use the `self.path(filepath)` function to get the path of a given `filepath` within the data folder.
Plugins have a convenience function `self.open` which will automatically look for the file if it exists, or open a new one if it doesn't: Plugins have a convenience function `self.open` which will automatically prepend the data folder to relative paths:
.. code:: python .. code:: python
@ -133,7 +132,7 @@ And you can run it with:
docker run -p 5000:5000 gsiupm/exampleplugin docker run -p 5000:5000 gsiupm/exampleplugin
If the plugin uses non-source files (:ref:`How should I load external data and files`), the recommended way is to use `SENPY_DATA` folder. If the plugin uses non-source files (:ref:`loading data and files`), the recommended way is to use `SENPY_DATA` folder.
Data can then be mounted in the container or added to the image. Data can then be mounted in the container or added to the image.
The former is recommended for open source plugins with licensed resources, whereas the latter is the most convenient and can be used for private images. The former is recommended for open source plugins with licensed resources, whereas the latter is the most convenient and can be used for private images.

View File

@ -1,3 +1,2 @@
sphinxcontrib-httpdomain>=1.4 sphinxcontrib-httpdomain>=1.4
ipykernel
nbsphinx nbsphinx

View File

@ -18,10 +18,10 @@ And higher level features can be built on top of these services, such as automat
These benefits are not limited to new services. These benefits are not limited to new services.
The community has developed wrappers for some proprietary and commercial services (such as sentiment140 and Meaning Cloud), so you can consult them as well. The community has developed wrappers for some proprietary and commercial services (such as sentiment140 and Meaning Cloud), so you can consult them as well.
Senpy comes with a built-in client in the client package. Senpy comes with a :ref:`built-in client`.
To achieve this goal, Senpy uses a Linked Data principled approach, based on the NIF (NLP Interchange Format) specification, and open vocabularies such as Marl and Onyx. To achieve this goal, Senpy uses a Linked Data principled approach, based on the NIF (NLP Interchange Format) specification, and open vocabularies such as Marl and Onyx.
You can learn more about this in :doc:`vocabularies`. You can learn more about this in :doc:`vocabularies`.
Check out :doc:`development` if you have developed an analysis algorithm (e.g. sentiment analysis) and you want to publish it as a service. Check out :doc:`plugins` if you have developed an analysis algorithm (e.g. sentiment analysis) and you want to publish it as a service.

View File

@ -251,15 +251,11 @@ class Plugin(with_metaclass(PluginMeta, models.Plugin)):
return alternative return alternative
raise IOError('File does not exist: {}'.format(fname)) raise IOError('File does not exist: {}'.format(fname))
def path(self, fpath):
if not os.path.isabs(fpath):
fpath = os.path.join(self.data_folder, fpath)
return fpath
def open(self, fpath, mode='r'): def open(self, fpath, mode='r'):
if 'w' in mode: if 'w' in mode:
# When writing, only use absolute paths or data_folder # When writing, only use absolute paths or data_folder
fpath = self.path(fpath) if not os.path.isabs(fpath):
fpath = os.path.join(self.data_folder, fpath)
else: else:
fpath = self.find_file(fpath) fpath = self.find_file(fpath)
@ -385,9 +381,7 @@ class SentimentPlugin(Analyser, Evaluable, models.SentimentPlugin):
activity = self.activity(parameters) activity = self.activity(parameters)
entries = [] entries = []
for feat in X: for feat in X:
if isinstance(feat, list): entries.append(models.Entry(nif__isString=feat[0]))
feat = ' '.join(feat)
entries.append(models.Entry(nif__isString=feat))
labels = [] labels = []
for e in self.process_entries(entries, activity): for e in self.process_entries(entries, activity):
sent = e.sentiments[0].polarity sent = e.sentiments[0].polarity

View File

@ -203,8 +203,8 @@ $(document).ready(function() {
draw_datasets(); draw_datasets();
} }
$(window).on('hashchange', hashchanged); // $(window).on('hashchange', hashchanged);
hashchanged(); // hashchanged();
$('.tooltip-form').tooltip(); $('.tooltip-form').tooltip();
$('.nav-pills a').on('shown.bs.tab', function (e) { $('.nav-pills a').on('shown.bs.tab', function (e) {

View File

@ -320,32 +320,24 @@ class PluginsTest(TestCase):
for i in range(50): for i in range(50):
testdata.append(["good", 1]) testdata.append(["good", 1])
for i in range(50): for i in range(50):
testdata.append(["bad", -1]) testdata.append(["bad", 0])
dataset = pd.DataFrame(testdata, columns=['text', 'polarity']) dataset = pd.DataFrame(testdata, columns=['text', 'polarity'])
class DummyPlugin(plugins.SentimentBox): class DummyPlugin(plugins.SentimentBox):
description = 'Plugin to test evaluation' description = 'Plugin to test evaluation'
version = 0 version = 0
classes = ['marl:Positive', 'marl:Negative']
def predict_one(self, features, **kwargs): def predict_one(self, features, **kwargs):
print(features[0]) return 0
return [0, 1]
class SmartPlugin(plugins.SentimentBox): class SmartPlugin(plugins.SentimentBox):
description = 'Plugin to test evaluation' description = 'Plugin to test evaluation'
version = 0 version = 0
classes = ['marl:Positive', 'marl:Negative']
def predict_one(self, features, **kwargs): def predict_one(self, features, **kwargs):
print(features[0])
if features[0] == 'good': if features[0] == 'good':
print('positive') return 1
return [1, 0] return 0
print('negative')
return [0, 1]
dpipe = DummyPlugin() dpipe = DummyPlugin()
results = plugins.evaluate(datasets={'testdata': dataset}, plugins=[dpipe], flatten=True) results = plugins.evaluate(datasets={'testdata': dataset}, plugins=[dpipe], flatten=True)