Merge pull request #85 from IndicoDataSolutions/keywords

ADD: keywords api support
This commit is contained in:
Madison May
2015-07-07 12:09:54 -04:00
10 changed files with 80 additions and 30 deletions
+2
View File
@@ -13,6 +13,7 @@ from indicoio.text.sentiment import political, posneg, sentiment_hq
from indicoio.text.sentiment import posneg as sentiment from indicoio.text.sentiment import posneg as sentiment
from indicoio.text.lang import language from indicoio.text.lang import language
from indicoio.text.tagging import text_tags from indicoio.text.tagging import text_tags
from indicoio.text.keywords import keywords
from indicoio.images.fer import fer from indicoio.images.fer import fer
from indicoio.images.features import facial_features from indicoio.images.features import facial_features
from indicoio.images.features import image_features from indicoio.images.features import image_features
@@ -20,6 +21,7 @@ from indicoio.utils.multi import predict_image, predict_text
from indicoio.config import API_NAMES from indicoio.config import API_NAMES
apis = dict((api, globals().get(api)) for api in API_NAMES) apis = dict((api, globals().get(api)) for api in API_NAMES)
for api in apis: for api in apis:
+2 -1
View File
@@ -50,7 +50,8 @@ TEXT_APIS = [
'political', 'political',
'sentiment', 'sentiment',
'language', 'language',
'sentiment_hq' 'sentiment_hq',
'keywords'
] ]
IMAGE_APIS = [ IMAGE_APIS = [
+4 -2
View File
@@ -26,7 +26,8 @@ def facial_features(image, cloud=None, batch=False, api_key=None, **kwargs):
:rtype: List containing feature responses :rtype: List containing feature responses
""" """
image = image_preprocess(image, batch=batch) image = image_preprocess(image, batch=batch)
return api_handler(image, cloud=cloud, api="facialfeatures", url_params={"batch":batch, "api_key":api_key}, **kwargs) url_params = {"batch": batch, "api_key": api_key}
return api_handler(image, cloud=cloud, api="facialfeatures", url_params=url_params, **kwargs)
def image_features(image, cloud=None, batch=False, api_key=None, **kwargs): def image_features(image, cloud=None, batch=False, api_key=None, **kwargs):
""" """
@@ -59,4 +60,5 @@ def image_features(image, cloud=None, batch=False, api_key=None, **kwargs):
:rtype: List containing features :rtype: List containing features
""" """
image = image_preprocess(image, batch=batch, size=(64,64)) image = image_preprocess(image, batch=batch, size=(64,64))
return api_handler(image, cloud=cloud, api="imagefeatures", url_params={"batch":batch, "api_key":api_key}, **kwargs) url_params = {"batch": batch, "api_key": api_key}
return api_handler(image, cloud=cloud, api="imagefeatures", url_params=url_params, **kwargs)
+2 -1
View File
@@ -28,4 +28,5 @@ def fer(image, cloud=None, batch=False, api_key=None, **kwargs):
:rtype: Dictionary containing emotion probability pairs :rtype: Dictionary containing emotion probability pairs
""" """
image = image_preprocess(image, batch=batch) image = image_preprocess(image, batch=batch)
return api_handler(image, cloud=cloud, api="fer", url_params={"batch":batch, "api_key":api_key}, **kwargs) url_params = {"batch": batch, "api_key": api_key}
return api_handler(image, cloud=cloud, api="fer", url_params=url_params, **kwargs)
+24
View File
@@ -0,0 +1,24 @@
from indicoio.utils.api import api_handler
import indicoio.config as config
def keywords(text, cloud=None, batch=False, api_key=None, **kwargs):
"""
Given input text, returns series of keywords and associated scores
Example usage:
.. code-block:: python
>>> import indicoio
>>> import numpy as np
>>> text = 'Monday: Delightful with mostly sunny skies. Highs in the low 70s.'
>>> keywords = indicoio.keywords(text, top_n=3)
>>> print "The keywords are: "+str(keywords.keys())
u'The keywords are ['delightful', 'highs', 'skies']
:param text: The text to be analyzed.
:type text: str or unicode
:rtype: Dictionary of feature score pairs
"""
url_params = {'batch': batch, 'api_key': api_key}
return api_handler(text, cloud=cloud, api="keywords", url_params=url_params, **kwargs)
+2 -2
View File
@@ -23,5 +23,5 @@ def language(text, cloud=None, batch=False, api_key=None, **kwargs):
:type text: str or unicode :type text: str or unicode
:rtype: Dictionary of language probability pairs :rtype: Dictionary of language probability pairs
""" """
url_params = {"batch": batch, "api_key": api_key}
return api_handler(text, cloud=cloud, api="language", url_params={"batch":batch, "api_key":api_key}, **kwargs) return api_handler(text, cloud=cloud, api="language", url_params=url_params, **kwargs)
+6 -6
View File
@@ -25,8 +25,8 @@ def political(text, cloud=None, batch=False, api_key=None, **kwargs):
:type text: str or unicode :type text: str or unicode
:rtype: Dictionary of party probability pairs :rtype: Dictionary of party probability pairs
""" """
url_params = {"batch": batch, "api_key": api_key}
return api_handler(text, cloud=cloud, api="political", url_params={"batch":batch, "api_key":api_key}, **kwargs) return api_handler(text, cloud=cloud, api="political", url_params=url_params, **kwargs)
def posneg(text, cloud=None, batch=False, api_key=None, **kwargs): def posneg(text, cloud=None, batch=False, api_key=None, **kwargs):
""" """
@@ -48,8 +48,8 @@ def posneg(text, cloud=None, batch=False, api_key=None, **kwargs):
:type text: str or unicode :type text: str or unicode
:rtype: Float :rtype: Float
""" """
url_params = {"batch": batch, "api_key": api_key}
return api_handler(text, cloud=cloud, api="sentiment", url_params={"batch":batch, "api_key":api_key}, **kwargs) return api_handler(text, cloud=cloud, api="sentiment", url_params=url_params, **kwargs)
def sentiment_hq(text, cloud=None, batch=False, api_key=None, **kwargs): def sentiment_hq(text, cloud=None, batch=False, api_key=None, **kwargs):
""" """
@@ -71,5 +71,5 @@ def sentiment_hq(text, cloud=None, batch=False, api_key=None, **kwargs):
:type text: str or unicode :type text: str or unicode
:rtype: Float :rtype: Float
""" """
url_params = {"batch": batch, "api_key": api_key}
return api_handler(text, cloud=cloud, api="sentimenthq", url_params={"batch":batch, "api_key":api_key}, **kwargs) return api_handler(text, cloud=cloud, api="sentimenthq", url_params=url_params, **kwargs)
+2 -2
View File
@@ -22,5 +22,5 @@ def text_tags(text, cloud=None, batch=False, api_key=None, **kwargs):
:type text: str or unicode :type text: str or unicode
:rtype: Dictionary of class probability pairs :rtype: Dictionary of class probability pairs
""" """
url_params = {"batch": batch, "api_key": api_key}
return api_handler(text, cloud=cloud, api="texttags", url_params={"batch":batch, "api_key":api_key}, **kwargs) return api_handler(text, cloud=cloud, api="texttags", url_params=url_params, **kwargs)
+2
View File
@@ -29,6 +29,8 @@ def api_handler(arg, cloud, api, url_params = {"batch":False, "api_key":None}, *
if apis: if apis:
url += "&apis=%s" % ",".join(apis) url += "&apis=%s" % ",".join(apis)
print url
response = requests.post(url, data=json_data, headers=JSON_HEADERS) response = requests.post(url, data=json_data, headers=JSON_HEADERS)
if response.status_code == 503 and cloud != None: if response.status_code == 503 and cloud != None:
raise IndicoError("Private cloud '%s' does not include api '%s'" % (cloud, api)) raise IndicoError("Private cloud '%s' does not include api '%s'" % (cloud, api))
+34 -16
View File
@@ -9,6 +9,7 @@ from indicoio import config
from indicoio import political, sentiment, fer, facial_features, language, image_features, text_tags from indicoio import political, sentiment, fer, facial_features, language, image_features, text_tags
from indicoio import batch_political, batch_sentiment, batch_fer, batch_facial_features from indicoio import batch_political, batch_sentiment, batch_fer, batch_facial_features
from indicoio import batch_language, batch_image_features, batch_text_tags from indicoio import batch_language, batch_image_features, batch_text_tags
from indicoio import keywords, batch_keywords
from indicoio import sentiment_hq, batch_sentiment_hq from indicoio import sentiment_hq, batch_sentiment_hq
from indicoio import predict_image, predict_text, batch_predict_image, batch_predict_text from indicoio import predict_image, predict_text, batch_predict_image, batch_predict_text
from indicoio.utils.errors import IndicoError from indicoio.utils.errors import IndicoError
@@ -32,18 +33,22 @@ class BatchAPIRun(unittest.TestCase):
response = batch_text_tags(test_data, api_key=self.api_key) response = batch_text_tags(test_data, api_key=self.api_key)
self.assertTrue(isinstance(response, list)) self.assertTrue(isinstance(response, list))
def test_batch_keywords(self):
test_data = ["A working api is key to the success of our young company"]
response = batch_keywords(test_data, api_key=self.api_key)
self.assertTrue(isinstance(response, list))
def test_batch_posneg(self): def test_batch_posneg(self):
test_data = ['Worst song ever', 'Best song ever'] test_data = ['Worst song ever', 'Best song ever']
response = batch_sentiment(test_data, api_key=self.api_key) response = batch_sentiment(test_data, api_key=self.api_key)
self.assertTrue(isinstance(response, list)) self.assertTrue(isinstance(response, list))
self.assertTrue(response[0] < 0.5) self.assertTrue(response[0] < 0.5)
# TODO: uncomment once the high quality sentiment API is publicly released def test_batch_sentiment_hq(self):
# def test_batch_sentiment_hq(self): test_data = ['Worst song ever', 'Best song ever']
# test_data = ['Worst song ever', 'Best song ever'] response = batch_sentiment_hq(test_data, api_key=self.api_key)
# response = batch_sentiment_hq(test_data, api_key=self.api_key) self.assertTrue(isinstance(response, list))
# self.assertTrue(isinstance(response, list)) self.assertTrue(response[0] < 0.5)
# self.assertTrue(response[0] < 0.5)
def test_batch_political(self): def test_batch_political(self):
test_data = ["Guns don't kill people, people kill people."] test_data = ["Guns don't kill people, people kill people."]
@@ -202,6 +207,20 @@ class FullAPIRun(unittest.TestCase):
for v in results.values(): for v in results.values():
assert v >= 0.1 assert v >= 0.1
def test_keywords(self):
text = "A working api is key to the success of our young company"
results = keywords(text)
assert 'api' in results.keys()
results = keywords(text, top_n=3)
assert len(results) is 3
results = keywords(text, threshold=.1)
for v in results.values():
assert v >= .1
def test_political(self): def test_political(self):
political_set = set(['Libertarian', 'Liberal', 'Conservative', 'Green']) political_set = set(['Libertarian', 'Liberal', 'Conservative', 'Green'])
test_string = "Guns don't kill people, people kill people." test_string = "Guns don't kill people, people kill people."
@@ -228,18 +247,17 @@ class FullAPIRun(unittest.TestCase):
self.assertTrue(isinstance(response, float)) self.assertTrue(isinstance(response, float))
self.assertTrue(response > 0.5) self.assertTrue(response > 0.5)
# TODO: uncomment when the high quality sentiment API is publicly released def test_sentiment_hq(self):
# def test_sentiment_hq(self): test_string = "Worst song ever."
# test_string = "Worst song ever." response = sentiment_hq(test_string)
# response = sentiment_hq(test_string)
# self.assertTrue(isinstance(response, float)) self.assertTrue(isinstance(response, float))
# self.assertTrue(response < 0.5) self.assertTrue(response < 0.5)
# test_string = "Best song ever." test_string = "Best song ever."
# response = sentiment_hq(test_string) response = sentiment_hq(test_string)
# self.assertTrue(isinstance(response, float)) self.assertTrue(isinstance(response, float))
# self.assertTrue(response > 0.5) self.assertTrue(response > 0.5)
def test_good_fer(self): def test_good_fer(self):
fer_set = set(['Angry', 'Sad', 'Neutral', 'Surprise', 'Fear', 'Happy']) fer_set = set(['Angry', 'Sad', 'Neutral', 'Surprise', 'Fear', 'Happy'])