Script Python permettant de nettoyer et préparer nos données csv.
You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.

69 lines
1.5 KiB

2 years ago
  1. #Importation des données dont nous aurons besoin
  2. import pandas as pd
  3. import numpy as np
  4. import csv
  5. import re
  6. #Afficher les tableaux de données
  7. df = pd.read_csv("C:\Users\luigg\Data_cleaning\Table_final.csv")
  8. df.head(5)
  9. #Supprimer les colonnes inutilisées ou non pertinentes
  10. to_drop = ['identifiant
  11. ','adresse
  12. ','commune
  13. ','coordonnees_x
  14. ','coordonnees_y
  15. ','code_epsg
  16. ','code_ape
  17. ','libelle_ape
  18. ','code_eprtr
  19. ','libelle_eprtr
  20. ','sigleUniteLegale_imp
  21. ','activitePrincipaleUniteLegale_imp
  22. ','Catégorie_entreprise_imp
  23. ','numeroVoieEtablissement_imp
  24. ','typeVoieEtablissement_imp
  25. ','libelleVoieEtablissement_imp
  26. ','libelleCommuneEtablissement_imp
  27. ','codeCommuneEtablissement_imp
  28. ','adresse_imp
  29. ','geo_imp
  30. ','com_code_imp
  31. ','code_commune_imp
  32. ','Code Officiel_EPCI_imp
  33. ','Code_Officiel_region_imp
  34. ','codenaffix_imp
  35. ','Intitule_NAF_imp
  36. ','groupe_imp
  37. ','division_imp
  38. ','nom_etablissement_tndan
  39. ','code_operation_eliminatio_valorisation_tndan
  40. ','libelle_operation_eliminatio_valorisation_tndan
  41. ','code_departement_tndan
  42. ','pays_tndan
  43. ','pays_pdan
  44. ','code_dechet_pdan
  45. ','libelle_dechet_pdan
  46. ','quantite_pdan
  47. ','unite_pdan
  48. ','code_operation_eliminatio_valorisation_pndan
  49. ','libelle_operation_eliminatio_valorisation_pndan
  50. ','code_departement_pndan
  51. ','pays_pndan
  52. ','code_dechet_pndan
  53. ','libelle_dechet_pndan
  54. ','quantite_pndan
  55. ','unite_pndan
  56. ','code_operation_eliminatio_valorisation_tdan
  57. ','libelle_operation_eliminatio_valorisation_tdan
  58. ','code_departement_tdan
  59. ','pays_tdan
  60. ','code_dechet_tdan
  61. ','libelle_dechet_tdan
  62. ']
  63. df.drop(to_drop, inplace = True, axis = 1)
  64. df.head(5)