diff facturation.py @ 3:1c5097aea031 draft

planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/facturation_ibps commit 6fd512a87951fcf82fe2c972d5f2d9d0c4facb11
author artbio
date Fri, 09 Nov 2018 05:59:20 -0500
parents 3bbcf49ad677
children ddc7b8073704
line wrap: on
line diff
--- a/facturation.py	Thu Nov 08 05:45:50 2018 -0500
+++ b/facturation.py	Fri Nov 09 05:59:20 2018 -0500
@@ -28,13 +28,14 @@
     # convert to unicode utf-8, remove &nbsp and €
     facture_html = facture_html.decode('utf-8')
     facture_html = facture_html.replace(r' ', r' ')
+    facture_html = facture_html.replace(r' €', '')
     facture_html = facture_html.replace(u' \u20ac', '')
     # parsing de la référence, de la date et de la période de facturation
     date = re.search(r'Paris le (.*?)</p>'.decode('utf-8'),
                      facture_html).group(1)
     periode = re.search(r'de la prestation (.*?)</p>'.decode('utf-8'),
                         facture_html).group(1)
-    ref = re.search(r'sur le bon de commande :\s*(.*?)<'.decode('utf-8'),
+    ref = re.search(r'rence interne d.*? :\s*(.*?)<'.decode('utf-8'),
                     facture_html).group(1)
 
     # parsing des tableaux html avec pandas
@@ -46,6 +47,8 @@
     # remove 'Adresse de l'appel à facturation : ' (\xa0:\xa0)
     adresse = facture_parsed[0].replace(
         r"Adresse de l\'appel \xe0 facturation : ", r'', regex=True)
+    adresse = adresse.replace(
+        r"Adresse du client : ", r'', regex=True)
     elements = facture_parsed[1]
 
     # conversion des noms de colonnes