"""jam-EDA.py: quick look at one traffic CSV in the public cse-cic-ids2018 bucket.

The script connects to S3 anonymously, lists the bucket, streams the CSV to
print its header and data rows 99-101, then downloads the whole object to
build a pandas DataFrame and report its row count.
"""

import csv
import io
import itertools

import pandas as pd

BUCKET = "cse-cic-ids2018"
CSV_KEY = (
    "cse-cic-ids2018/Processed Traffic Data for ML Algorithms/"
    "Wednesday-28-02-2018_TrafficForML_CICFlowMeter.csv"
)

# Earlier pandas-only variant, kept for reference. It read the object straight
# from S3 and dropped rows whose Label column holds the literal text 'Label':
#   df = pd.read_csv('s3://cse-cic-ids2018/Processed Traffic Data for ML Algorithms/Wednesday-28-02-2018_TrafficForML_CICFlowMeter.csv', low_memory=False)
#   df = df[df.Label != 'Label']
#   print(df[100:101])


def peek_rows(lines, first=99, last=101):
    """Return the CSV header and the data rows numbered ``first``..``last``.

    Args:
        lines: Any iterable of CSV text lines (an open text file works).
        first: 1-based number of the first data row to keep (header excluded).
        last: 1-based number of the last data row to keep, inclusive.

    Returns:
        ``(header, rows)`` where ``header`` is the first parsed record (or
        ``None`` when the input is empty) and ``rows`` is a list of
        ``(row_number, record)`` tuples.
    """
    reader = csv.reader(lines)
    header = next(reader, None)
    if header is None:
        return None, []
    numbered = enumerate(reader, start=1)
    # islice stops consuming input once `last` is reached, so a large file is
    # not scanned to the end just to show a handful of rows.
    window = itertools.islice(numbered, max(first - 1, 0), max(last, 0))
    return header, list(window)


def frame_from_text(text):
    """Parse CSV text into a DataFrame.

    ``pd.read_csv`` treats a plain ``str`` argument as a path or URL, so the
    text is wrapped in ``StringIO`` to be read as file contents instead.
    Raises ``pandas.errors.EmptyDataError`` when ``text`` is empty.
    """
    return pd.read_csv(io.StringIO(text))


def first_record(text):
    """Return the first parsed CSV record of ``text``, or ``None`` if empty.

    ``csv.reader`` iterates its argument item by item; handing it a ``str``
    directly would yield single characters, hence the ``StringIO`` wrapper.
    """
    return next(csv.reader(io.StringIO(text)), None)


def main():
    """Run the exploration against S3 and print the findings."""
    # Imported here so the parsing helpers above remain importable on machines
    # where s3fs is not installed.
    import s3fs

    fs = s3fs.S3FileSystem(anon=True)
    print(fs.ls(BUCKET))

    # Pass 1: stream the object as text and show the header plus rows 99-101.
    with fs.open(CSV_KEY, "r", encoding="utf-8") as f:
        header, rows = peek_rows(f)
    print(header)
    for number, row in rows:
        print(number, row)

    # Pass 2: pull the whole object into memory as bytes.
    # NOTE(review): this holds the complete file (and a decoded copy) in RAM;
    # confirm the object size is acceptable for the machine running this.
    with fs.open(CSV_KEY, "rb") as f:
        csvdata = f.read()
    print(len(csvdata))
    print(csvdata[0:1000])

    csvdata = csvdata.decode("utf-8")
    data_frame = frame_from_text(csvdata)
    print(len(data_frame))
    print(first_record(csvdata))


if __name__ == "__main__":
    main()