You signed in with another tab or window. Reload to refresh your session.You signed out in another tab or window. Reload to refresh your session.You switched accounts on another tab or window. Reload to refresh your session.Dismiss alert
This document lists all Python packages pre-installed in the Offline Python Runtime Docker container, organized by category with version information and use cases.
🗂️ Package Categories
📊 Data Science & Analytics
Package
Version
Description
Use Cases
pandas
Latest
Data manipulation and analysis
Data cleaning, transformation, analysis
numpy
Latest
Numerical computing
Scientific computing, array operations
scikit-learn
Latest
Machine learning library
Predictive modeling, data mining
matplotlib
Latest
Data visualization
Charts, plots, graphs
scipy
Latest
Scientific computing
Optimization, signal processing
🗄️ Database Connectivity
Package
Version
Description
Use Cases
oracledb
Latest
Oracle database driver
Oracle database connectivity
sqlalchemy
Latest
SQL toolkit and ORM
Multiple SQL database support
pymongo
Latest
MongoDB driver
NoSQL database operations
pyodbc
Latest
ODBC database driver
Generic database connectivity
mssql-python
Latest
Microsoft SQL Server driver
SQL Server connectivity
📈 Data Processing & ETL
Package
Version
Description
Use Cases
duckdb
Latest
In-process analytical database
High-performance analytics
dlt
Latest
Data loading tool
ETL pipeline orchestration
pyarrow
Latest
Columnar data format
Efficient data interchange
openpyxl
Latest
Excel file handling
Excel file read/write operations
tabulate
Latest
Table formatting
Data presentation, CLI output
pyreadstat
Latest
Statistical data files
SAS, SPSS file formats
🌐 Web & Networking
Package
Version
Description
Use Cases
requests
Latest
HTTP library
API calls, web requests
httpx
Latest
Async HTTP client
Modern async HTTP operations
urllib3
Latest
HTTP client library
HTTP connection pooling
🔐 Security & Validation
Package
Version
Description
Use Cases
cryptography
Latest
Cryptographic recipes
Data encryption, security
pydantic
Latest
Data validation
Input validation, settings
🛠️ Development & Testing
Package
Version
Description
Use Cases
pytest
Latest
Testing framework
Unit testing, integration tests
ipykernel
Latest
Jupyter kernel
Notebook development, debugging
⚙️ Configuration & Environment
Package
Version
Description
Use Cases
python-dotenv
Latest
Environment variable management
Configuration management
📋 Complete Package List
# Get package information in container
# Prints the interpreter version, then every installed distribution sorted
# case-insensitively by project name, followed by the total count.
podman run -it offline-python-runtime:latest python -c "
import pkg_resources
import sys

print('🐍 Python Version:', sys.version)
print('\n📦 Installed Packages:')
packages = list(pkg_resources.working_set)
packages.sort(key=lambda x: x.project_name.lower())
for pkg in packages:
    version = pkg.version if hasattr(pkg, 'version') else 'Unknown'
    print(f'  {pkg.project_name:<25} {version}')
print(f'\n📊 Total packages: {len(packages)}')
"
# Enterprise ETL with dlt and DuckDB
import dlt
import duckdb
import pandas as pd


@dlt.source
def oracle_source():
    """Dlt source for Oracle data.

    This sample does not open a database connection; it returns two
    hard-coded rows so the rest of the example can run end to end.

    Returns:
        A list of dicts, each with a single ``"data"`` key.
    """
    # Connect to Oracle and extract data
    # Illustrative query template only: it is never formatted or executed here.
    query = "SELECT * FROM source_table WHERE updated_date > '{start_date}'"
    # Implementation would connect to Oracle
    return [{"data": "sample_row_1"}, {"data": "sample_row_2"}]
@dlt.resource
def processed_data():
    """Transform data with DuckDB.

    Loads the rows produced by ``oracle_source()`` into an in-memory DuckDB
    database, adds a ``data_length`` column and a constant ``status`` column,
    and returns the result.

    Returns:
        A list of row dicts (``DataFrame.to_dict('records')``).
    """
    # Get raw data from source
    raw_data = oracle_source()

    # Process with DuckDB
    conn = duckdb.connect(':memory:')
    try:
        df = pd.DataFrame(raw_data)
        conn.register('raw_data', df)

        # Transform
        result = conn.execute("""
            SELECT
                data,
                LENGTH(data) as data_length,
                'processed' as status
            FROM raw_data
        """).fetchdf()
    finally:
        # Release the in-memory database even if the query fails.
        conn.close()

    return result.to_dict('records')
@dlt.destination
def local_file_system(data):
    """Load to local file system.

    Writes ``data`` as CSV (without the index column) to
    ``/home/appuser/output/processed_data.csv``.

    Args:
        data: Anything ``pandas.DataFrame`` accepts as its data argument.

    Returns:
        The number of rows written.
    """
    df = pd.DataFrame(data)
    df.to_csv('/home/appuser/output/processed_data.csv', index=False)
    return len(df)
# ETL Pipeline
pipeline = dlt.pipeline(
    pipeline_name="oracle_etl",
    destination=local_file_system
)

# Run pipeline
pipeline.run(oracle_source() | processed_data())
🔧 Package Management
Check Package Updates
# Check for available updates
import subprocess
import json


def _installed_and_latest(pip_output):
    """Return ``(installed, latest)`` parsed from ``pip index versions`` output.

    Looks for the ``INSTALLED:`` and ``LATEST:`` lines; either element is
    ``None`` when its line is absent.
    """
    fields = {}
    for line in pip_output.splitlines():
        label, sep, value = line.strip().partition(':')
        if sep:
            fields[label] = value.strip()
    return fields.get('INSTALLED'), fields.get('LATEST')


def check_updates(packages=None):
    """Check for package updates.

    Runs ``pip index versions <package>`` for each package and prints one
    status line per package: update available, up to date, or error.

    Args:
        packages: Iterable of distribution names to check. Defaults to
            pandas, numpy, oracledb and scikit-learn.
    """
    if packages is None:
        packages = ['pandas', 'numpy', 'oracledb', 'scikit-learn']

    for package in packages:
        try:
            result = subprocess.run(
                ['pip', 'index', 'versions', package],
                capture_output=True, text=True
            )
        except OSError as e:
            # Raised when the pip executable cannot be started.
            print(f"❌ {package}: Error checking updates - {e}")
            continue

        if result.returncode != 0:
            # Report failures instead of silently skipping the package.
            stderr_lines = result.stderr.strip().splitlines()
            detail = stderr_lines[-1] if stderr_lines else f"pip exited with code {result.returncode}"
            print(f"❌ {package}: Error checking updates - {detail}")
            continue

        installed, latest = _installed_and_latest(result.stdout)
        if installed is None or latest is None:
            # Without both lines there is nothing to compare.
            print(f"❌ {package}: Error checking updates - installed/latest version not reported")
        elif installed != latest:
            print(f"🔄 {package}: Update available - {latest}")
        else:
            print(f"✅ {package}: Up to date")
Install Additional Packages
# Install packages in running container
podman exec -it python-runtime-container pip install --user <package-name>

# Install from requirements file
podman exec -it python-runtime-container pip install --user -r requirements.txt

# Install with specific version
podman exec -it python-runtime-container pip install --user <package>==<version>

# Install development packages
podman exec -it python-runtime-container pip install --user jupyter scipy seaborn
# Check for package conflicts
# Reports requirements that are not installed at all; version mismatches
# between installed packages are not checked by this snippet.
podman run -it offline-python-runtime:latest python -c "
import pkg_resources

conflicts = []
installed = {d.key: d.version for d in pkg_resources.working_set}
for dist in pkg_resources.working_set:
    for req in dist.requires():
        if req.key not in installed:
            conflicts.append(f'{dist.key} requires {req.key} but it is not installed')

if conflicts:
    print('❌ Package conflicts found:')
    for conflict in conflicts:
        print(f'  {conflict}')
else:
    print('✅ No package conflicts detected')
"
Version Compatibility
# Check Python 3.13 compatibility
podman run -it offline-python-runtime:latest python -c "
import sys
import pkg_resources

print(f'🐍 Python Version: {sys.version}')
# Count over a list so this does not depend on the working set supporting len()
print(f'📦 Number of installed packages: {len(list(pkg_resources.working_set))}')

# Check for known compatibility issues
# Maps package name -> (importable module name, note); the two names differ
# for scikit-learn, whose module is sklearn.
known_issues = {
    'pandas': ('pandas', 'Some deprecated features may be removed'),
    'scikit-learn': ('sklearn', 'API changes in recent versions'),
    'oracledb': ('oracledb', 'New thin/thick mode options'),
}

for package, (module_name, issue) in known_issues.items():
    try:
        __import__(module_name)
        print(f'⚠️ {package}: {issue}')
    except ImportError:
        print(f'❌ {package}: Not installed')
"
📚 Package Documentation
Quick Reference Commands
# Get package help
podman exec -it python-runtime-container python -c "import pandas as pd; help(pd.read_csv)"

# Get package version
podman exec -it python-runtime-container python -c "
import oracledb
print(f'oracledb version: {oracledb.__version__}')
"

# List package contents
podman exec -it python-runtime-container python -c "
import numpy as np
print('NumPy functions:')
print([attr for attr in dir(np) if not attr.startswith('_')])
"
Common Import Patterns
# Enterprise import patterns
import os
import sys
from pathlib import Path

# Data science imports
import pandas as pd
import numpy as np
import matplotlib.pyplot as plt
from sklearn.ensemble import RandomForestClassifier

# Database imports
import oracledb
import pymongo
from sqlalchemy import create_engine

# Data processing imports
import duckdb
import pyarrow
import dlt

# Security and validation
from cryptography.fernet import Fernet
from pydantic import BaseModel

# Web and API imports
import requests
import httpx

# Development and testing
import pytest
from ipykernel import kernelapp as app

# Configuration
from dotenv import load_dotenv