In [ ]:
!pip install paramiko
In [ ]:
import paramiko
import pandas as pd
from io import StringIO
# Replace with your SSH server details
ssh_server = ''''ssh.example.com''''
ssh_user = ''''your-username''''
ssh_password = ''''your-password''''
folder_path = ''''/path/to/your/folder/''''
# Connect to the SSH server
ssh = paramiko.SSHClient()
ssh.set_missing_host_key_policy(paramiko.AutoAddPolicy())
ssh.connect(ssh_server, username=ssh_user, password=ssh_password)
# List all files in the directory
stdin, stdout, stderr = ssh.exec_command(f''''ls {folder_path}'''')
files = stdout.read().decode().split()
# Read multiple CSV files into DataFrames
dfs = []
for file in files:
if file.endswith(''''.csv''''):
sftp = ssh.open_sftp()
with sftp.open(f''''{folder_path}/{file}'''', ''''r'''') as f:
data = f.read().decode(''''utf-8'''')
df = pd.read_csv(StringIO(data))
dfs.append(df)
sftp.close()
# Combine all DataFrames into one
combined_df = pd.concat(dfs, ignore_index=True)
print(combined_df.head())
# Close the SSH connection
ssh.close()