# xls_pasrer.py (1018 B)
  1. '''
  2. Created on Feb 14, 2020
  3. @author: deeejas
  4. '''
  5. import pandas as pd
  6. dtypes={'NETWEIGHT': 'int64', 'NETVALUE': 'int64'}
  7. df = pd.read_excel('intrastat.xlsx', dtype=dtypes) #, parse_dates=True, date_parser='DATA'
  8. # df['VSCODE'].dtype =
  9. # print(df['DATA'])
  10. # print(df['VSCODE'])
  11. # print(df.groupby(['VSCODE',
  12. # 'ACode', 'Bcode', 'DeliveryTermsCode',
  13. # 'TransportCode', 'CountryOfOrigin',
  14. # 'EXP'])['NETVALUE', 'NETWEIGHT'].sum())
  15. # print(df['VSCODE'])
  16. grouped_df = df.groupby(['VSCODE', 'ACode', 'Bcode', 'DeliveryTermsCode',
  17. 'TransportCode', 'CountryOfOrigin',
  18. 'EXP', 'SUPPL'])[['NETVALUE', 'NETWEIGHT', 'Q', 'SUPPLVALUE']].sum()
  19. print(grouped_df.index[0][7])
  20. # print(grouped_df.index[1][0])
  21. # print(grouped_df.columns)
  22. # for i in range(1, len(grouped_df)+1):
  23. # print(grouped_df['VSCODE'])
  24. # print(df_gr['NETVAELUE'].sum())
  25. # for columns in df.groupby(['VSCODE', 'EXP']).sum():
  26. # print(columns.title())