#!/usr/bin/env python
# -*- coding: utf-8 -*-
#from __future__ import unicode_literals
- from pattern.fr import parse, split
# Sample French sentence fed to the parser.
texte_brut = (
    u"Le petit chat rugit alors que l'esclave humain tarde à accomplir "
    u"sa tâche de nourrissage du maître et seigneur."
)
# Result of running pattern.fr's parse() on the sample sentence.
texte_traite = parse(texte_brut)
def _en_texte(valeur):
    """Return ``str(valeur)``, or its UTF-8 encoding when ``str()`` cannot encode it."""
    try:
        return str(valeur)
    except UnicodeEncodeError:
        # Python 2 only: str() on a unicode object uses the ASCII codec and
        # fails on accented words such as u"tâche".  Encode as UTF-8 instead,
        # which matches the source encoding declared at the top of this file.
        return valeur.encode('utf-8')


def imprimer_structure_mot(mot):
    """Print the attributes of one parsed word, one ``name : value`` line each.

    The attributes read, in order, are ``index``, ``string``,
    ``_custom_tags``, ``sentence``, ``pnp``, ``chunk``, ``lemma`` and
    ``type``.

    Args:
        mot: object exposing the eight attributes above (presumably a
            pattern.fr word taken from ``phrase.words`` -- confirm with
            the caller).

    Returns:
        None. The output goes to standard output.
    """
    attributs = (
        'index',
        'string',
        '_custom_tags',
        'sentence',
        'pnp',
        'chunk',
        'lemma',
        'type',
    )
    for attribut in attributs:
        # A single parenthesised argument prints identically whether
        # ``print`` is the Python 2 statement or the Python 3 function.
        print(attribut + ' : ' + _en_texte(getattr(mot, attribut)))
def _imprimer_section(titre, extraire, prefixe_erreur='erreur : '):
    """Print a separator, a section title, then the value returned by ``extraire``.

    Any exception raised while computing or printing the value is reported
    on a single line (``prefixe_erreur`` followed by the exception text) so
    that one failing section does not stop the remaining ones.

    Args:
        titre: heading printed under the separator.
        extraire: zero-argument callable returning the value to print.
        prefixe_erreur: text printed in front of the exception message.
    """
    print("——————————")
    print(titre)
    try:
        # A single parenthesised argument prints identically whether
        # ``print`` is the Python 2 statement or the Python 3 function.
        print(extraire())
    except Exception as e:
        # Deliberately broad: this is a best-effort diagnostic dump.
        print(prefixe_erreur + str(e))


def _imprimer_structures(phrase):
    """Print the words, chunks and attribute names of one parsed sentence."""
    _imprimer_section("mots :", lambda: phrase.words)
    _imprimer_section("groupes de mots :", lambda: str(phrase.chunks))
    _imprimer_section(
        "structure, phrase :",
        lambda: phrase.__dict__.keys(),
        prefixe_erreur='💩 erreur : ',
    )
    _imprimer_section(
        "structure, mot :",
        lambda: phrase.words[0].__dict__.keys(),
    )
    # This section is now guarded like the others: a sentence without any
    # chunk would otherwise raise IndexError and abort the whole script.
    _imprimer_section(
        "structure, chunk (groupe de mots) :",
        lambda: phrase.chunks[0].__dict__.keys(),
    )


# Dump every sentence obtained by splitting the parsed sample text.
for phrase in split(texte_traite):
    _imprimer_structures(phrase)
|