opener-opinion-detector-basic 1.0.0
- checksums.yaml +7 -0
- data/README.md +30 -0
- data/bin/opinion-detector-basic +19 -0
- data/bin/opinion-detector-basic-server +10 -0
- data/config.ru +4 -0
- data/core/opinion_detector_basic_multi.py +499 -0
- data/core/packages/KafNafParser-1.3.tar.gz +0 -0
- data/core/packages/VUA_pylib-1.4.tar.gz +0 -0
- data/core/site-packages/pre_build/VUKafParserPy-1.0-py2.7.egg-info/PKG-INFO +10 -0
- data/core/site-packages/pre_build/VUKafParserPy-1.0-py2.7.egg-info/SOURCES.txt +7 -0
- data/core/site-packages/pre_build/VUKafParserPy-1.0-py2.7.egg-info/dependency_links.txt +1 -0
- data/core/site-packages/pre_build/VUKafParserPy-1.0-py2.7.egg-info/installed-files.txt +11 -0
- data/core/site-packages/pre_build/VUKafParserPy-1.0-py2.7.egg-info/top_level.txt +1 -0
- data/core/site-packages/pre_build/VUKafParserPy/KafDataObjectsMod.py +165 -0
- data/core/site-packages/pre_build/VUKafParserPy/KafDataObjectsMod.pyc +0 -0
- data/core/site-packages/pre_build/VUKafParserPy/KafParserMod.py +439 -0
- data/core/site-packages/pre_build/VUKafParserPy/KafParserMod.pyc +0 -0
- data/core/site-packages/pre_build/VUKafParserPy/__init__.py +7 -0
- data/core/site-packages/pre_build/VUKafParserPy/__init__.pyc +0 -0
- data/core/vendor/src/crfsuite/AUTHORS +1 -0
- data/core/vendor/src/crfsuite/COPYING +27 -0
- data/core/vendor/src/crfsuite/ChangeLog +103 -0
- data/core/vendor/src/crfsuite/INSTALL +236 -0
- data/core/vendor/src/crfsuite/Makefile.am +19 -0
- data/core/vendor/src/crfsuite/Makefile.in +783 -0
- data/core/vendor/src/crfsuite/README +183 -0
- data/core/vendor/src/crfsuite/aclocal.m4 +9018 -0
- data/core/vendor/src/crfsuite/autogen.sh +38 -0
- data/core/vendor/src/crfsuite/compile +143 -0
- data/core/vendor/src/crfsuite/config.guess +1502 -0
- data/core/vendor/src/crfsuite/config.h.in +198 -0
- data/core/vendor/src/crfsuite/config.sub +1714 -0
- data/core/vendor/src/crfsuite/configure +14273 -0
- data/core/vendor/src/crfsuite/configure.in +149 -0
- data/core/vendor/src/crfsuite/crfsuite.sln +42 -0
- data/core/vendor/src/crfsuite/depcomp +630 -0
- data/core/vendor/src/crfsuite/example/chunking.py +49 -0
- data/core/vendor/src/crfsuite/example/crfutils.py +179 -0
- data/core/vendor/src/crfsuite/example/ner.py +270 -0
- data/core/vendor/src/crfsuite/example/pos.py +78 -0
- data/core/vendor/src/crfsuite/example/template.py +88 -0
- data/core/vendor/src/crfsuite/frontend/Makefile.am +29 -0
- data/core/vendor/src/crfsuite/frontend/Makefile.in +640 -0
- data/core/vendor/src/crfsuite/frontend/dump.c +116 -0
- data/core/vendor/src/crfsuite/frontend/frontend.vcxproj +129 -0
- data/core/vendor/src/crfsuite/frontend/iwa.c +273 -0
- data/core/vendor/src/crfsuite/frontend/iwa.h +65 -0
- data/core/vendor/src/crfsuite/frontend/learn.c +439 -0
- data/core/vendor/src/crfsuite/frontend/main.c +137 -0
- data/core/vendor/src/crfsuite/frontend/option.c +93 -0
- data/core/vendor/src/crfsuite/frontend/option.h +86 -0
- data/core/vendor/src/crfsuite/frontend/readdata.h +38 -0
- data/core/vendor/src/crfsuite/frontend/reader.c +136 -0
- data/core/vendor/src/crfsuite/frontend/tag.c +427 -0
- data/core/vendor/src/crfsuite/genbinary.sh.in +15 -0
- data/core/vendor/src/crfsuite/include/Makefile.am +11 -0
- data/core/vendor/src/crfsuite/include/Makefile.in +461 -0
- data/core/vendor/src/crfsuite/include/crfsuite.h +1063 -0
- data/core/vendor/src/crfsuite/include/crfsuite.hpp +555 -0
- data/core/vendor/src/crfsuite/include/crfsuite_api.hpp +400 -0
- data/core/vendor/src/crfsuite/include/os.h +61 -0
- data/core/vendor/src/crfsuite/install-sh +520 -0
- data/core/vendor/src/crfsuite/lib/cqdb/COPYING +28 -0
- data/core/vendor/src/crfsuite/lib/cqdb/Makefile.am +21 -0
- data/core/vendor/src/crfsuite/lib/cqdb/Makefile.in +549 -0
- data/core/vendor/src/crfsuite/lib/cqdb/cqdb.vcxproj +86 -0
- data/core/vendor/src/crfsuite/lib/cqdb/include/cqdb.h +524 -0
- data/core/vendor/src/crfsuite/lib/cqdb/src/cqdb.c +587 -0
- data/core/vendor/src/crfsuite/lib/cqdb/src/lookup3.c +976 -0
- data/core/vendor/src/crfsuite/lib/crf/Makefile.am +46 -0
- data/core/vendor/src/crfsuite/lib/crf/Makefile.in +721 -0
- data/core/vendor/src/crfsuite/lib/crf/crf.vcxproj +216 -0
- data/core/vendor/src/crfsuite/lib/crf/src/crf1d.h +353 -0
- data/core/vendor/src/crfsuite/lib/crf/src/crf1d_context.c +705 -0
- data/core/vendor/src/crfsuite/lib/crf/src/crf1d_encode.c +943 -0
- data/core/vendor/src/crfsuite/lib/crf/src/crf1d_feature.c +352 -0
- data/core/vendor/src/crfsuite/lib/crf/src/crf1d_model.c +994 -0
- data/core/vendor/src/crfsuite/lib/crf/src/crf1d_tag.c +550 -0
- data/core/vendor/src/crfsuite/lib/crf/src/crfsuite.c +492 -0
- data/core/vendor/src/crfsuite/lib/crf/src/crfsuite_internal.h +236 -0
- data/core/vendor/src/crfsuite/lib/crf/src/crfsuite_train.c +272 -0
- data/core/vendor/src/crfsuite/lib/crf/src/dataset.c +106 -0
- data/core/vendor/src/crfsuite/lib/crf/src/dictionary.c +118 -0
- data/core/vendor/src/crfsuite/lib/crf/src/holdout.c +80 -0
- data/core/vendor/src/crfsuite/lib/crf/src/logging.c +91 -0
- data/core/vendor/src/crfsuite/lib/crf/src/logging.h +48 -0
- data/core/vendor/src/crfsuite/lib/crf/src/params.c +335 -0
- data/core/vendor/src/crfsuite/lib/crf/src/params.h +80 -0
- data/core/vendor/src/crfsuite/lib/crf/src/quark.c +172 -0
- data/core/vendor/src/crfsuite/lib/crf/src/quark.h +46 -0
- data/core/vendor/src/crfsuite/lib/crf/src/rumavl.c +1107 -0
- data/core/vendor/src/crfsuite/lib/crf/src/rumavl.h +160 -0
- data/core/vendor/src/crfsuite/lib/crf/src/train_arow.c +408 -0
- data/core/vendor/src/crfsuite/lib/crf/src/train_averaged_perceptron.c +242 -0
- data/core/vendor/src/crfsuite/lib/crf/src/train_l2sgd.c +507 -0
- data/core/vendor/src/crfsuite/lib/crf/src/train_lbfgs.c +338 -0
- data/core/vendor/src/crfsuite/lib/crf/src/train_passive_aggressive.c +435 -0
- data/core/vendor/src/crfsuite/lib/crf/src/vecmath.h +341 -0
- data/core/vendor/src/crfsuite/ltmain.sh +8413 -0
- data/core/vendor/src/crfsuite/missing +376 -0
- data/core/vendor/src/crfsuite/swig/Makefile.am +13 -0
- data/core/vendor/src/crfsuite/swig/Makefile.in +365 -0
- data/core/vendor/src/crfsuite/swig/crfsuite.cpp +2 -0
- data/core/vendor/src/crfsuite/swig/export.i +32 -0
- data/core/vendor/src/crfsuite/swig/python/README +92 -0
- data/core/vendor/src/crfsuite/swig/python/crfsuite.py +329 -0
- data/core/vendor/src/crfsuite/swig/python/export_wrap.cpp +14355 -0
- data/core/vendor/src/crfsuite/swig/python/export_wrap.h +63 -0
- data/core/vendor/src/crfsuite/swig/python/prepare.sh +9 -0
- data/core/vendor/src/crfsuite/swig/python/sample_tag.py +52 -0
- data/core/vendor/src/crfsuite/swig/python/sample_train.py +68 -0
- data/core/vendor/src/crfsuite/swig/python/setup.py +44 -0
- data/core/vendor/src/crfsuite/win32/stdint.h +679 -0
- data/core/vendor/src/liblbfgs/AUTHORS +1 -0
- data/core/vendor/src/liblbfgs/COPYING +22 -0
- data/core/vendor/src/liblbfgs/ChangeLog +120 -0
- data/core/vendor/src/liblbfgs/INSTALL +231 -0
- data/core/vendor/src/liblbfgs/Makefile.am +10 -0
- data/core/vendor/src/liblbfgs/Makefile.in +638 -0
- data/core/vendor/src/liblbfgs/NEWS +0 -0
- data/core/vendor/src/liblbfgs/README +71 -0
- data/core/vendor/src/liblbfgs/aclocal.m4 +6985 -0
- data/core/vendor/src/liblbfgs/autogen.sh +38 -0
- data/core/vendor/src/liblbfgs/config.guess +1411 -0
- data/core/vendor/src/liblbfgs/config.h.in +64 -0
- data/core/vendor/src/liblbfgs/config.sub +1500 -0
- data/core/vendor/src/liblbfgs/configure +21146 -0
- data/core/vendor/src/liblbfgs/configure.in +107 -0
- data/core/vendor/src/liblbfgs/depcomp +522 -0
- data/core/vendor/src/liblbfgs/include/lbfgs.h +745 -0
- data/core/vendor/src/liblbfgs/install-sh +322 -0
- data/core/vendor/src/liblbfgs/lbfgs.sln +26 -0
- data/core/vendor/src/liblbfgs/lib/Makefile.am +24 -0
- data/core/vendor/src/liblbfgs/lib/Makefile.in +499 -0
- data/core/vendor/src/liblbfgs/lib/arithmetic_ansi.h +133 -0
- data/core/vendor/src/liblbfgs/lib/arithmetic_sse_double.h +294 -0
- data/core/vendor/src/liblbfgs/lib/arithmetic_sse_float.h +298 -0
- data/core/vendor/src/liblbfgs/lib/lbfgs.c +1371 -0
- data/core/vendor/src/liblbfgs/lib/lib.vcxproj +95 -0
- data/core/vendor/src/liblbfgs/ltmain.sh +6426 -0
- data/core/vendor/src/liblbfgs/missing +353 -0
- data/core/vendor/src/liblbfgs/sample/Makefile.am +15 -0
- data/core/vendor/src/liblbfgs/sample/Makefile.in +433 -0
- data/core/vendor/src/liblbfgs/sample/sample.c +81 -0
- data/core/vendor/src/liblbfgs/sample/sample.cpp +126 -0
- data/core/vendor/src/liblbfgs/sample/sample.vcxproj +105 -0
- data/core/vendor/src/svm_light/LICENSE.txt +59 -0
- data/core/vendor/src/svm_light/Makefile +105 -0
- data/core/vendor/src/svm_light/kernel.h +40 -0
- data/core/vendor/src/svm_light/svm_classify.c +197 -0
- data/core/vendor/src/svm_light/svm_common.c +985 -0
- data/core/vendor/src/svm_light/svm_common.h +301 -0
- data/core/vendor/src/svm_light/svm_hideo.c +1062 -0
- data/core/vendor/src/svm_light/svm_learn.c +4147 -0
- data/core/vendor/src/svm_light/svm_learn.h +169 -0
- data/core/vendor/src/svm_light/svm_learn_main.c +397 -0
- data/core/vendor/src/svm_light/svm_loqo.c +211 -0
- data/ext/hack/Rakefile +17 -0
- data/ext/hack/support.rb +88 -0
- data/lib/opener/opinion_detector_basic.rb +91 -0
- data/lib/opener/opinion_detector_basic/public/markdown.css +284 -0
- data/lib/opener/opinion_detector_basic/server.rb +16 -0
- data/lib/opener/opinion_detector_basic/version.rb +5 -0
- data/lib/opener/opinion_detector_basic/views/index.erb +97 -0
- data/lib/opener/opinion_detector_basic/views/result.erb +15 -0
- data/opener-opinion-detector-basic.gemspec +36 -0
- data/pre_build_requirements.txt +1 -0
- metadata +309 -0
checksums.yaml ADDED
@@ -0,0 +1,7 @@
---
SHA1:
  metadata.gz: cc6dd6c71396853ddb39ff898599ad4c3f466401
  data.tar.gz: c820abad54167482947c7a56d78cba5331482957
SHA512:
  metadata.gz: ee6555c6dee3540ed4b7a7817e106cfb459281f159c60d73b2af548b9bc19b967ce70bc52e8bac991eabdab6b74a6d30606f7672c339d75c999bf2666a8a66ec
  data.tar.gz: 72fc4d27ce5b98fab608880492a2c7b135e24542eb9b2cb26b3bd4c32008095f966ec944588d30aaeb278c265bdb65bd22688dd43649df7cd16d9ea0e99ece55
data/README.md ADDED
@@ -0,0 +1,30 @@
Opinion Detector Basic
======================

This module implements an opinion detector for English (it also works for Dutch and
German). The language is determined by the "xml:lang" attribute in the input KAF
file. Depending on the value of this attribute, the corresponding lexicon will
be loaded. This module detects three elements of the opinions:

* Expression: the actual opinion expression
* Target: what the previous expression is about
* Holder: who is stating that expression

Requirements
------------

* VUKafParserPy: parser in python for KAF files
* lxml: library for processing xml in python

Usage
-----

The input KAF file has to be annotated with at least the term layer, with
polarity information. Correct input files for this module are the output KAF
files from the polarity tagger module.

To tag an input KAF file example.kaf with opinions you can run:

    $ cat example.with.polarities.kaf | core/opinion_detector_basic_multi.py > output.with.opinions.kaf

The output will be the input KAF file extended with the opinion layer.
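For illustration only, the sketch below shows roughly what the opinion layer appended by this module looks like. The element names (opinion, opinion_holder, opinion_target, opinion_expression with polarity and strength attributes, span and target elements, and lemma comments) are taken from data/core/opinion_detector_basic_multi.py further down; the wrapping <opinions> element name, the term ids and the lemmas are assumptions, not output copied from the module.

    <!-- illustrative sketch; layer element name, ids and lemmas are hypothetical -->
    <opinions>
      <opinion>
        <opinion_holder>
          <!--i-->
          <span>
            <target id="t_1"/>
          </span>
        </opinion_holder>
        <opinion_target>
          <!--service-->
          <span>
            <target id="t_5"/>
          </span>
        </opinion_target>
        <opinion_expression polarity="positive" strength="1">
          <!--good-->
          <span>
            <target id="t_4"/>
          </span>
        </opinion_expression>
      </opinion>
    </opinions>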
data/bin/opinion-detector-basic ADDED
@@ -0,0 +1,19 @@
#!/usr/bin/env ruby

require_relative '../lib/opener/opinion_detector_basic'

# STDIN.tty? returns `false` if data is being piped into the current process.
if STDIN.tty?
  input = nil
else
  input = STDIN.read
end

kernel = Opener::OpinionDetectorBasic.new(:args => ARGV)
stdout, stderr, process = kernel.run(input)

if process.success?
  puts stdout
else
  abort stderr
end
data/bin/opinion-detector-basic-server ADDED
@@ -0,0 +1,10 @@
#!/usr/bin/env ruby

require 'rack'

# Without calling `Rack::Server#options` manually the CLI arguments will never
# be passed, thus the application can't be specified as a constructor argument.
server = Rack::Server.new
server.options[:config] = File.expand_path('../../config.ru', __FILE__)

server.start
data/core/opinion_detector_basic_multi.py ADDED
@@ -0,0 +1,499 @@
#!/usr/bin/env python

import sys
import getopt
import os

this_folder = os.path.dirname(os.path.realpath(__file__))

# This updates the load path to ensure that the local site-packages directory
# can be used to load packages (e.g. a locally installed copy of lxml).
sys.path.append(os.path.join(this_folder, 'site-packages/pre_build'))

from VUKafParserPy import KafParser
from collections import defaultdict
import operator
import pprint
import lxml
from lxml import etree
import logging


def mix_lists(l1,l2):
    newl=[]
    min_l = min(len(l1),len(l2))
    for x in range(min_l):
        newl.append(l1[x])
        newl.append(l2[x])

    if len(l1)>len(l2):
        newl.extend(l1[min_l:])
    elif len(l2)>len(l1):
        newl.extend(l2[min_l:])
    return newl


class OpinionExpression:
    def __init__(self,spans,sentence,value):
        self.ids = spans
        self.sentence = sentence
        self.value = value
        self.target_ids = []
        self.candidates_r=[]
        self.candidates_l=[]
        self.holder = []

    def __repr__(self):
        r='Ids:'+'#'.join(self.ids)+' Sent:'+self.sentence+' Value:'+str(self.value)+' Target:'+'#'.join(self.target_ids)+'\n'
        r+='Right cand: '+str(self.candidates_r)+'\n'
        r+='Left cand: '+str(self.candidates_l)+'\n'
        return r


class MyToken:
    def __init__(self,id,lemma,pos,polarity,sent_mod,sent):
        self.id = id
        self.lemma = lemma
        self.pos = pos
        self.polarity = polarity
        self.sent_mod = sent_mod
        self.sentence = sent
        self.use_it = True
        self.list_ids = [id]
        self.value = 0

        if polarity == 'positive':
            self.value = 1
        elif polarity == 'negative':
            self.value = -1

        if sent_mod == 'intensifier':
            self.value = 2
        elif sent_mod == 'shifter':
            self.value = -1

    def isNegator(self):
        return self.sent_mod == 'shifter'

    def isIntensifier(self):
        return self.sent_mod == 'intensifier'

    def is_opinion_expression(self):
        return self.use_it and self.polarity is not None

    def __repr__(self):
        if self.use_it:
            return self.id+' lemma:'+self.lemma.encode('utf-8')+'.'+self.pos.encode('utf-8')+' pol:'+str(self.polarity)+' sentmod:'+str(self.sent_mod)+' sent:'+self.sentence+' use:'+str(self.use_it)+' list:'+'#'.join(self.list_ids)+' val:'+str(self.value)
        else:
            return '\t'+self.id+' lemma:'+self.lemma.encode('utf-8')+'.'+self.pos.encode('utf-8')+' pol:'+str(self.polarity)+' sentmod:'+str(self.sent_mod)+' sent:'+self.sentence+' use:'+str(self.use_it)+' list:'+'#'.join(self.list_ids)+' val:'+str(self.value)


def obtain_opinion_expressions(tokens,lang='nl'):
    logging.debug(' Obtaining opinion expressions')
    my_tokens = tokens[:]

    accumulate_several_modifiers = True
    apply_modifiers = True
    apply_conjunctions = True

    ## Acumulate doble/triple intensifiers or negators
    if accumulate_several_modifiers:
        logging.debug(' Accumulating modifiers')
        t = 0
        while t < len(my_tokens):
            if my_tokens[t].isNegator() or my_tokens[t].isIntensifier():
                if t+1 < len(my_tokens) and ( my_tokens[t+1].isNegator() or my_tokens[t+1].isIntensifier()):
                    ## There are 2 negators/intensifiers next to each other
                    ## The first one is deactivated and the second one is modified
                    my_tokens[t].use_it = False
                    my_tokens[t+1].value *= my_tokens[t].value
                    my_tokens[t+1].list_ids += my_tokens[t].list_ids
                    logging.debug(' Accucumating '+'-'.join(my_tokens[t+1].list_ids))
            t+=1
    ###########################################

    ## Apply intensifiers/negators over the next elements
    if apply_modifiers:
        logging.debug(' Applying modifiers')
        t = 0
        while t < len(my_tokens):
            if my_tokens[t].use_it and (my_tokens[t].isNegator() or my_tokens[t].isIntensifier()):
                ## Try to modify the next token:
                if t+1<len(my_tokens):
                    my_tokens[t+1].value *= my_tokens[t].value
                    my_tokens[t+1].list_ids += my_tokens[t].list_ids
                    my_tokens[t].use_it = False
                    logging.debug(' Applied modifier over '+'-'.join(my_tokens[t+1].list_ids))
            t += 1
    ###########################################

    if apply_conjunctions:
        if lang=='nl':
            concat = [',','en']
        elif lang=='en':
            concat = [',','and']
        elif lang=='es':
            concat = [',','y','e']
        elif lang=='it':
            concat = [',','e','ed']
        elif lang=='de':
            concat = [',','und']
        elif lang == 'fr':
            concat=[',','et']
        logging.debug(' Applying conjunctions:'+str(concat))

        t = 0
        while t < len(my_tokens):
            if my_tokens[t].use_it and my_tokens[t].value!=0: ## Find the first one
                #print 'FOUND ',my_tokens[t]
                logging.debug(' Found token '+str(my_tokens[t]))
                list_aux = my_tokens[t].list_ids
                used = [t]
                value_aux = my_tokens[t].value
                my_tokens[t].use_it = False
                #print 'Modified',my_tokens[t]

                x = t+1
                while True:
                    if x>=len(my_tokens):
                        break

                    if my_tokens[x].lemma in concat:
                        ## list_aux += my_tokens[x].list_ids Dont use it as part of the OE
                        my_tokens[x].use_it = False
                        x+=1
                    elif (my_tokens[x].use_it and my_tokens[x].value!=0):
                        #print '\Also ',my_tokens[x]
                        logging.debug(' Found token '+str(my_tokens[x]))
                        list_aux += my_tokens[x].list_ids

                        used.append(x)
                        my_tokens[x].use_it = False
                        value_aux += my_tokens[x].value
                        x += 1
                    else:
                        break
                #print 'OUT OF THE WHILE'
                ## The last one in the list used is the one accumulating all
                last_pos = used[-1]
                my_tokens[last_pos].value = value_aux
                my_tokens[last_pos].list_ids = list_aux
                my_tokens[last_pos].use_it = True
                logging.debug(' Regenerating '+str(my_tokens[last_pos]))
                t = x ## next token
            t += 1

    ## Create OpinionExpression
    my_opinion_exps = []
    logging.debug(' Generating output')
    for token in my_tokens:
        if token.use_it and token.value != 0:
            op_exp = OpinionExpression(token.list_ids,token.sentence,token.value)
            my_opinion_exps.append(op_exp)
    return my_opinion_exps


'''
def get_distance(id1, id2):
    pos1 = int(id1[id1.find('_')+1:])
    pos2 = int(id2[id2.find('_')+1:])
    if pos1>pos2:
        return pos1-pos2
    else:
        return pos2-pos1
'''


def obtain_holders(ops_exps,sentences,lang):
    if lang=='nl':
        holders = ['ik','we','wij','ze','zij','jullie','u','hij','het','jij','je','mij','me','hem','haar','ons','hen','hun']
    elif lang=='en':
        holders = ['i','we','he','she','they','it','you']
    elif lang =='es':
        holders = ['yo','tu','nosotros','vosotros','ellos','ellas','nosotras','vosotras']
    elif lang =='it':
        holders = ['io','tu','noi','voi','loro','lei','lui']
    elif lang == 'de':
        holders = ['ich','du','wir','ihr','sie','er']
    elif lang == 'fr':
        holders = ['je','tu','lui','elle','nous','vous','ils','elles']

    logging.debug('Obtaining holders with list: '+str(holders))

    for oe in ops_exps:
        sent = oe.sentence
        list_terms = sentences[str(sent)]
        for lemma, pos, term_id in list_terms:
            if lemma in holders:
                oe.holder.append(term_id)
                logging.debug(' Selected for '+str(oe)+' holder'+lemma+' '+term_id)
                break


# This is specific for the basic version
def filter_candidates(candidates,ids_oe):
    ##filtered = [(lemma, pos,term_id) for (lemma,pos, term_id) in candidates if len(lemma)>=4 and term_id not in ids_oe]
    filtered = [(lemma,pos,id) for (lemma,pos,id) in candidates if pos in ['N','R']]
    return filtered


def obtain_targets_improved(ops_exps,sentences):
    logging.debug(' Obtaining targets improved')
    #print>>sys.stderr,'#'*40
    #print>>sys.stderr,'#'*40

    #print>>sys.stderr,'Beginning with obtain targets'
    ## sentences --> dict [str(numsent)] ==> list of (lemma, term_id)

    all_ids_in_oe = []
    for oe in ops_exps:
        all_ids_in_oe.extend(oe.ids)
    #print>>sys.stderr,'All list of ids in oe',all_ids_in_oe

    for oe in ops_exps:
        #print>>sys.stderr,'\tOE:',oe
        logging.debug(' OpExp: '+str(oe))

        ids_in_oe = oe.ids
        sent = oe.sentence
        list_terms = sentences[str(sent)]
        #print>>sys.stderr,'\t\tTerms in sent:',list_terms

        ###########################################
        # First rule: noun to the right within maxdistance tokens
        max_distance_right = 3
        biggest_index = -1
        for idx, (lemma,pos,term_id) in enumerate(list_terms):
            if term_id in ids_in_oe:
                biggest_index = idx

        #print>>sys.stderr,'\t\tBI',biggest_index
        if biggest_index+1 >= len(list_terms): ## is the last element and we shall skip it
            #print>>sys.stderr,'\t\tNot possible to apply 1st rule'
            pass
        else:
            candidates=list_terms[biggest_index+1:min(biggest_index+1+max_distance_right,len(list_terms))]
            ## Filter candidates
            #print>>sys.stderr,'\t\tCandidates for right rule no filter',candidates
            #oe.__candidates_right = [(lemma, term_id) for (lemma, term_id) in candidates if len(lemma)>=4 and term_id not in all_ids_in_oe]
            oe.candidates_r = filter_candidates(candidates,all_ids_in_oe)
            logging.debug(' Candidates filtered right'+str(oe.candidates_r))
            #print>>sys.stderr,'\t\tCandidates for right rule no filter',oe.__candidates_right
        ######################################################################################

        ###########################################
        max_distance_left = 3
        smallest_index = 0
        for idx,(lemma,pos,term_id) in enumerate(list_terms):
            if term_id in ids_in_oe:
                smallest_index = idx
                break
        #print>>sys.stderr,'Smalles index:',smallest_index
        if smallest_index == 0:
            #print>>sys.stderr,'\t\tNot possible to apply left rule'
            pass
        else:
            candidates = list_terms[max(0,smallest_index-1-max_distance_left):smallest_index]
            ## Filter candidates
            #print>>sys.stderr,'\t\tCandidates for left rule no filter',candidates
            oe.candidates_l = filter_candidates(candidates,all_ids_in_oe)
            logging.debug(' Candidates filtered left: '+str(oe.candidates_l))
        ######################################################################################

    #print>>sys.stderr,'#'*40
    #print>>sys.stderr,'#'*40

    ## Filling oe.target_ids
    assigned_as_targets = []

    # First we assign to all the first candidate on the right, if any, and not assigned
    logging.debug(' Applying first to the right rule')
    for oe in ops_exps:
        #print>>sys.stderr,'A ver ',oe
        if len(oe.candidates_r) !=0:
            lemma, pos, id = oe.candidates_r[0]
            if id not in assigned_as_targets:
                oe.target_ids.append(id)
                ###assigned_as_targets.append(id) # Uncomment to avoid selection of the same target more than once
                logging.debug(' OpExp '+str(oe)+' selected '+id)
                #print>>sys.stderr,'Asignamos',id

    logging.debug(' Applying most close rule')
    for oe in ops_exps:
        if len(oe.target_ids) == 0: # otherwise it's solved
            intercalados_list = mix_lists([id for _,_,id in oe.candidates_r],[id for _,_,id in oe.candidates_l])
            for id in intercalados_list:
                if id not in assigned_as_targets:
                    oe.target_ids.append(id)
                    ###assigned_as_targets.append(id) # Uncomment to avoid selection of the same target more than once
                    logging.debug(' OpExp '+str(oe)+' selected '+id)
                    break


######## MAIN ROUTINE ############

## Check if we are reading from a pipeline
if sys.stdin.isatty():
    print>>sys.stderr,'Input stream required.'
    print>>sys.stderr,'Example usage: cat myUTF8file.kaf.xml |',sys.argv[0]
    sys.exit(-1)
########################################

logging.basicConfig(stream=sys.stderr,format='%(asctime)s - %(levelname)s - %(message)s',level=logging.DEBUG)

## Processing the parameters
my_time_stamp = True
remove_opinions = True
opinion_strength = True
try:
    opts, args = getopt.getopt(sys.argv[1:],"",["no-time","no-remove-opinions","no-opinion-strength"])
    for opt, arg in opts:
        if opt == "--no-time":
            my_time_stamp = False
        elif opt == "--no-remove-opinions":
            remove_opinions = False
        elif opt == "--no-opinion-strength":
            opinion_strength = False
except getopt.GetoptError:
    pass
#########################################

logging.debug('Include timestamp: '+str(my_time_stamp))

# Parsing the KAF file
try:
    my_kaf_tree = KafParser(sys.stdin)
except Exception as e:
    print>>sys.stderr,'Error parsing input'
    print>>sys.stderr,'Stream input must be a valid KAF file'
    print>>sys.stderr,'Error: ',str(e)
    sys.exit(-1)


lang = my_kaf_tree.getLanguage()
## Creating data structure
sentences = defaultdict(list)
my_tokens = []

# CREATE the datastructure for the tokens
n=0
lemma_for_tid = {}
for term in my_kaf_tree.getTerms():
    n+=1
    term_id = term.getId()
    lemma = term.getLemma()
    lemma_for_tid[term_id] = lemma
    kaf_pos = term.getPos()
    #print>>sys.stderr,kaf_pos
    list_span = term.get_list_span() ## List of token ids in the span layer of the term
    sentiment = term.getSentiment()
    polarity = sent_mod = None
    if sentiment is not None:
        polarity = sentiment.getPolarity()
        sent_mod = sentiment.getSentimentModifier()
    sentence = my_kaf_tree.getToken(list_span[0]).get('sent') ## The sentence of the first token element in span
    my_tokens.append(MyToken(term_id,lemma,kaf_pos,polarity,sent_mod,sentence))

    sentences[str(sentence)].append((lemma,kaf_pos,term_id))
#############################

logging.debug('Num terms loaded: '+str(n))
logging.debug('Num sentences: '+str(len(sentences)))

logging.debug('Obtaining opinion expressions')
my_ops_exps = obtain_opinion_expressions(my_tokens,lang)
print>>sys.stderr,my_ops_exps

logging.debug('Obtaining targets')
obtain_targets_improved(my_ops_exps,sentences)

logging.debug('Obtaining holders')
obtain_holders(my_ops_exps,sentences,lang)


## Create the elements
logging.debug('Generating KAF output')

if remove_opinions:
    my_kaf_tree.remove_opinion_layer()

for oe in my_ops_exps:
    op_ele = etree.Element('opinion')

    ## Holder
    if len(oe.holder)!=0:
        oe.holder.sort()
        c = ' '.join(lemma_for_tid[tid] for tid in oe.holder)
        op_hol = etree.Element('opinion_holder')
        op_hol.append(etree.Comment(c))
        op_ele.append(op_hol)
        span_op_hol = etree.Element('span')
        op_hol.append(span_op_hol)
        for id in oe.holder:
            span_op_hol.append(etree.Element('target',attrib={'id':id}))

    ## Target
    op_tar = etree.Element('opinion_target')
    op_ele.append(op_tar)

    if len(oe.target_ids)!=0: ## if there are no targets, there is no opinion element
        oe.target_ids.sort()
        c = ' '.join(lemma_for_tid[tid] for tid in oe.target_ids)
        op_tar.append(etree.Comment(c))
        span_op_tar = etree.Element('span')
        op_tar.append(span_op_tar)
        for id in oe.target_ids:
            span_op_tar.append(etree.Element('target',attrib={'id':id}))

    # Expression
    if oe.value > 0: pol = 'positive'
    elif oe.value < 0: pol = 'negative'
    else: pol = 'neutral'

    op_exp = etree.Element('opinion_expression')
    op_exp.set('polarity',pol)
    if opinion_strength:
        op_exp.set('strength',str(oe.value))

    op_ele.append(op_exp)
    oe.ids.sort()
    c = ' '.join(lemma_for_tid[tid] for tid in oe.ids)
    op_exp.append(etree.Comment(c))
    span_exp = etree.Element('span')
    op_exp.append(span_exp)
    for id in oe.ids:
        span_exp.append(etree.Element('target',attrib={'id':id}))

    ## Append the op_ele to the opinions layer
    my_kaf_tree.addElementToLayer('opinions', op_ele)


my_kaf_tree.addLinguisticProcessor('Basic opinion detector with Pos','1.0','opinions', my_time_stamp)
my_kaf_tree.saveToFile(sys.stdout)
logging.debug('Process finished')
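The main routine above accepts three optional long flags parsed with getopt: --no-time (omit the timestamp from the linguistic processor header), --no-remove-opinions (keep any existing opinion layer), and --no-opinion-strength (omit the strength attribute). An illustrative invocation in the same piped style as the README, with the file names as placeholders:

    # hypothetical file names; the flags are those defined in the getopt call above
    $ cat example.with.polarities.kaf | core/opinion_detector_basic_multi.py --no-time --no-opinion-strength > output.with.opinions.kaf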