mirror of https://github.com/minio/minio.git
				
				
				
			
		
			
	
	
		
			34 lines
		
	
	
		
			1.0 KiB
		
	
	
	
		
			Python
		
	
	
	
		
		
			
		
	
	
			34 lines
		
	
	
		
			1.0 KiB
		
	
	
	
		
			Python
		
	
	
	
| 
								 | 
							
								#!/usr/bin/env/env python3
							 | 
						||
| 
								 | 
							
								import boto3
							 | 
						||
| 
								 | 
							
								
							 | 
						||
| 
								 | 
							
								s3 = boto3.client('s3',
							 | 
						||
| 
								 | 
							
								                  endpoint_url='http://localhost:9000',
							 | 
						||
| 
								 | 
							
								                  aws_access_key_id='minio',
							 | 
						||
| 
								 | 
							
								                  aws_secret_access_key='minio123',
							 | 
						||
| 
								 | 
							
								                  region_name='us-east-1')
							 | 
						||
| 
								 | 
							
								
							 | 
						||
| 
								 | 
							
								r = s3.select_object_content(
							 | 
						||
| 
								 | 
							
								    Bucket='mycsvbucket',
							 | 
						||
| 
								 | 
							
								    Key='sampledata/TotalPopulation.csv.gz',
							 | 
						||
| 
								 | 
							
								    ExpressionType='SQL',
							 | 
						||
| 
								 | 
							
								    Expression="select * from s3object s where s.Location like '%United States%'",
							 | 
						||
| 
								 | 
							
								    InputSerialization={
							 | 
						||
| 
								 | 
							
								        'CSV': {
							 | 
						||
| 
								 | 
							
								            "FileHeaderInfo": "USE",
							 | 
						||
| 
								 | 
							
								        },
							 | 
						||
| 
								 | 
							
								        'CompressionType': 'GZIP',
							 | 
						||
| 
								 | 
							
								    },
							 | 
						||
| 
								 | 
							
								    OutputSerialization={'CSV': {}},
							 | 
						||
| 
								 | 
							
								)
							 | 
						||
| 
								 | 
							
								
							 | 
						||
| 
								 | 
							
								for event in r['Payload']:
							 | 
						||
| 
								 | 
							
								    if 'Records' in event:
							 | 
						||
| 
								 | 
							
								        records = event['Records']['Payload'].decode('utf-8')
							 | 
						||
| 
								 | 
							
								        print(records)
							 | 
						||
| 
								 | 
							
								    elif 'Stats' in event:
							 | 
						||
| 
								 | 
							
								        statsDetails = event['Stats']['Details']
							 | 
						||
| 
								 | 
							
								        print("Stats details bytesScanned: ")
							 | 
						||
| 
								 | 
							
								        print(statsDetails['BytesScanned'])
							 | 
						||
| 
								 | 
							
								        print("Stats details bytesProcessed: ")
							 | 
						||
| 
								 | 
							
								        print(statsDetails['BytesProcessed'])
							 |