runpod
diff --git a/‎.github/workflows/CI-pylint.yml
+2-2 b/‎.github/workflows/CI-pylint.yml
+2-2
diff --git a/‎.github/workflows/CI-pytests.yml
+2-2 b/‎.github/workflows/CI-pytests.yml
+2-2
diff --git a/‎CONTRIBUTING.md
+1-1 b/‎CONTRIBUTING.md
+1-1
diff --git a/‎examples/endpoints/asyncio_job_request.py
+2-3 b/‎examples/endpoints/asyncio_job_request.py
+2-3
diff --git a/‎pyproject.toml
+4-3 b/‎pyproject.toml
+4-3
diff --git a/‎pytest.ini
+4 b/‎pytest.ini
+4
diff --git a/‎requirements.txt
+1 b/‎requirements.txt
+1
diff --git a/‎runpod/__init__.py
+1-3 b/‎runpod/__init__.py
+1-3
diff --git a/‎runpod/api/graphql.py
+3-1 b/‎runpod/api/graphql.py
+3-1
diff --git a/‎runpod/cli/groups/pod/commands.py
+7-3 b/‎runpod/cli/groups/pod/commands.py
+7-3
diff --git a/‎runpod/endpoint/asyncio/asyncio_runner.py
+5-4 b/‎runpod/endpoint/asyncio/asyncio_runner.py
+5-4
diff --git a/‎runpod/http_client.py
+95 b/‎runpod/http_client.py
+95
diff --git a/‎runpod/serverless/modules/rp_fastapi.py
+2-1 b/‎runpod/serverless/modules/rp_fastapi.py
+2-1
diff --git a/‎runpod/serverless/modules/rp_http.py
+10-7 b/‎runpod/serverless/modules/rp_http.py
+10-7
diff --git a/‎runpod/serverless/modules/rp_job.py
+3-5 b/‎runpod/serverless/modules/rp_job.py
+3-5
diff --git a/‎runpod/serverless/modules/rp_logger.py
+8-2 b/‎runpod/serverless/modules/rp_logger.py
+8-2
@@ -31,7 +31,7 @@ jobs:
       - name: Install Dependencies
         run: |
           python -m pip install --upgrade pip
-          pip install .[test]
+          pip install '.[test]'
 
       - name: Pylint Source
-        run: pylint --ignore-paths='build/*' --ignore='_version.py' $(find . -type f -name '*.py') \
+        run: pylint $(git ls-files '*.py')
@@ -30,7 +30,7 @@ jobs:
       - name: Install Dependencies
         run: |
           python -m pip install --upgrade pip
-          pip install .[test]
+          pip install '.[test]'
 
       - name: Run Tests
-        run: pytest --cov-config=.coveragerc --timeout=120 --timeout_method=thread --cov=runpod --cov-report=xml --cov-report=term-missing --cov-fail-under=100 -W error -p no:cacheprovider -p no:unraisableexception
+        run: pytest --cov-config=.coveragerc --timeout=120 --timeout_method=thread --cov=runpod --cov-report=xml --cov-report=term-missing --cov-fail-under=98 -W error -p no:cacheprovider -p no:unraisableexception
@@ -35,7 +35,7 @@ Here is a quick guide on how to contribute code to this project:
 6. Run tests to ensure that your changes do not break any existing functionality. You can run tests using the following command:
 
     ```bash
-    pip install .[test]
+    pip install '.[test]'
     pytest
     ```
 
 
@@ -3,10 +3,9 @@
 """
 
 import asyncio
-import aiohttp
 
 import runpod
-from runpod import AsyncioEndpoint, AsyncioJob
+from runpod import http_client, AsyncioEndpoint, AsyncioJob
 
 asyncio.set_event_loop_policy(asyncio.WindowsSelectorEventLoopPolicy())  # For Windows Users
 
@@ -17,7 +16,7 @@ async def main():
     '''
     Function to run the example.
     '''
-    async with aiohttp.ClientSession() as session:
+    async with http_client.AsyncClientSession() as session:
         # Invoke API
         payload = {}
         endpoint = AsyncioEndpoint("ENDPOINT_ID", session)
 
@@ -54,11 +54,12 @@ runpod = "runpod.cli.entry:runpod_cli"
 test = [
     "asynctest",
     "nest_asyncio",
-    "pylint",
-    "pytest",
+    "pylint==3.2.5",
+    "pytest-asyncio",
     "pytest-cov",
     "pytest-timeout",
-    "pytest-asyncio",
+    "pytest-watch",
+    "pytest",
 ]
 
 [build-system]
 
@@ -0,0 +1,4 @@
+[pytest]
+addopts = --durations=10 --cov-config=.coveragerc --timeout=120 --timeout_method=thread --cov=runpod --cov-report=xml --cov-report=term-missing --cov-fail-under=98 -W error -p no:cacheprovider -p no:unraisableexception
+python_files = tests.py test_*.py *_test.py
+norecursedirs = venv *.egg-info .git build
@@ -5,6 +5,7 @@ backoff >= 2.2.1
 boto3 >= 1.26.165
 click >= 8.1.7
 colorama >= 0.2.5, < 0.4.7
+cryptography < 43.0.0
 fastapi[all] >= 0.94.0
 paramiko >= 3.3.1
 prettytable >= 3.9.0
 
@@ -42,9 +42,7 @@
 else:
     api_key = None  # pylint: disable=invalid-name
 
-api_url_base = "https://api.runpod.io"  # pylint: disable=invalid-name
-
-endpoint_url_base = "https://api.runpod.ai/v2"  # pylint: disable=invalid-name
+endpoint_url_base = os.environ.get("RUNPOD_ENDPOINT_BASE_URL", "https://api.runpod.ai/v2")  # pylint: disable=invalid-name
 
 
 # --------------------------- Force Logging Levels --------------------------- #
 
@@ -3,6 +3,7 @@
 """
 
 import json
+import os
 from typing import Any, Dict
 
 import requests
@@ -18,7 +19,8 @@ def run_graphql_query(query: str) -> Dict[str, Any]:
     Run a GraphQL query
     '''
     from runpod import api_key  # pylint: disable=import-outside-toplevel, cyclic-import
-    url = f"https://api.runpod.io/graphql?api_key={api_key}"
+    api_url_base = os.environ.get("RUNPOD_API_BASE_URL", "https://api.runpod.io")
+    url = f"{api_url_base}/graphql?api_key={api_key}"
 
     headers = {
         "Content-Type": "application/json",
 
@@ -33,19 +33,23 @@ def create_new_pod(name, image, gpu_type, gpu_count, support_public_ip): # pylin
     '''
     Creates a pod.
     '''
+    kwargs = {
+        "gpu_count": gpu_count,
+        "support_public_ip": support_public_ip,
+    }
+
     if not name:
         name = click.prompt('Enter pod name', default='RunPod-CLI-Pod')
 
     quick_launch = click.confirm('Would you like to launch default pod?', abort=True)
     if quick_launch:
         image = 'runpod/base:0.0.0'
         gpu_type = 'NVIDIA GeForce RTX 3090'
-        ports ='22/tcp'
+        kwargs["ports"] ='22/tcp'
 
         click.echo('Launching default pod...')
 
-    new_pod = create_pod(name, image, gpu_type,
-                         gpu_count=gpu_count, support_public_ip=support_public_ip, ports=ports)
+    new_pod = create_pod(name, image, gpu_type, **kwargs)
 
     click.echo(f'Pod {new_pod["id"]} has been created.')
 
 
@@ -3,22 +3,23 @@
 
 from typing import Any, Dict
 import asyncio
-import aiohttp
 
+from runpod.http_client import ClientSession
 from runpod.endpoint.helpers import FINAL_STATES, is_completed
 
 
 class Job:
     """Class representing a job for an asynchronous endpoint"""
 
-    def __init__(self, endpoint_id: str, job_id: str, session: aiohttp.ClientSession):
+    def __init__(self, endpoint_id: str, job_id: str, session: ClientSession):
         from runpod import api_key, endpoint_url_base  # pylint: disable=import-outside-toplevel,cyclic-import
 
         self.endpoint_id = endpoint_id
         self.job_id = job_id
         self.headers = {
             "Content-Type": "application/json",
-            "Authorization": f"Bearer {api_key}"
+            "Authorization": f"Bearer {api_key}",
+            "X-Request-ID": job_id,
         }
         self.session = session
         self.endpoint_url_base = endpoint_url_base
@@ -100,7 +101,7 @@ async def cancel(self) -> dict:
 class Endpoint:
     """Class for running endpoint"""
 
-    def __init__(self, endpoint_id: str, session: aiohttp.ClientSession):
+    def __init__(self, endpoint_id: str, session: ClientSession):
         from runpod import api_key, endpoint_url_base  # pylint: disable=import-outside-toplevel
 
         self.endpoint_id = endpoint_id
 
@@ -0,0 +1,95 @@
+"""
+HTTP Client abstractions
+"""
+
+import os
+import requests
+from aiohttp import (
+    ClientSession,
+    ClientTimeout,
+    TCPConnector,
+)
+from .tracer import (
+    create_aiohttp_tracer,
+    create_request_tracer,
+)
+from .cli.groups.config.functions import get_credentials
+from .user_agent import USER_AGENT
+
+
+def get_auth_header():
+    """
+    Build the default request headers (content type, auth, user agent).
+
+    The `Authorization` value is the stored credentials' `api_key`; when that
+    is missing or empty it falls back to the RUNPOD_AI_API_KEY env variable.
+    """
+    credentials = get_credentials() or {}
+    auth = credentials.get("api_key") or os.getenv("RUNPOD_AI_API_KEY", "")
+
+    return {
+        "Content-Type": "application/json",
+        "Authorization": auth,
+        "User-Agent": USER_AGENT,
+    }
+
+
+def AsyncClientSession(*args, **kwargs): # pylint: disable=invalid-name
+    """
+    Factory for a pre-configured aiohttp.ClientSession (inheritance is deprecated).
+    Caller-supplied keyword arguments override the defaults set here.
+    TODO: use httpx
+    """
+    defaults = {
+        "connector": TCPConnector(limit=0),
+        "headers": get_auth_header(),
+        "timeout": ClientTimeout(600, ceil_threshold=400),
+        "trace_configs": [create_aiohttp_tracer()],
+    }
+    # Merge so an explicit kwarg replaces a default instead of raising TypeError
+    return ClientSession(*args, **{**defaults, **kwargs})
+
+
+class SyncClientSession(requests.Session):
+    """
+    Inherits requests.Session to override `request()` method for tracing
+    TODO: use httpx
+    """
+
+    def request(self, method, url, **kwargs):  # pylint: disable=arguments-differ
+        """
+        Override for tracing. Not using super().request()
+        to capture metrics for connection and transfer times.
+        Keyword arguments are split between `requests.Request` (by parameter
+        name) and `Session.send()`; returns the response from `send()`.
+        """
+        # Parameter names of `requests.Request.__init__` (locals are excluded)
+        init_code = requests.Request.__init__.__code__
+        request_params = init_code.co_varnames[: init_code.co_argcount]
+
+        with create_request_tracer() as tracer:
+            # kwargs accepted by `requests.Request`; the rest go to `send()`
+            request_kwargs = {k: v for k, v in kwargs.items() if k in request_params}
+            send_kwargs = {k: v for k, v in kwargs.items() if k not in request_kwargs}
+
+            # Create a PreparedRequest object to hold the request details
+            req = requests.Request(method, url, **request_kwargs)
+            prepped = self.prepare_request(req)
+            tracer.request = prepped  # Assign the request to the tracer
+
+            # Merge environment settings. `proxies` must be a dict: requests
+            # calls `proxies.setdefault()` when proxy env variables are set.
+            settings = self.merge_environment_settings(
+                prepped.url,
+                send_kwargs.get("proxies") or {},
+                send_kwargs.get("stream"),
+                send_kwargs.get("verify"),
+                send_kwargs.get("cert"),
+            )
+            send_kwargs.update(settings)
+
+            # Send the request
+            response = self.send(prepped, **send_kwargs)
+            tracer.response = response  # Assign the response to the tracer
+
+            return response
@@ -18,6 +18,7 @@
 from .worker_state import Jobs
 from .rp_ping import Heartbeat
 from ...version import __version__ as runpod_version
+from ...http_client import SyncClientSession
 
 
 RUNPOD_ENDPOINT_ID = os.environ.get("RUNPOD_ENDPOINT_ID", None)
@@ -157,7 +158,7 @@ def _send_webhook(url: str, payload: Dict[str, Any]) -> bool:
     Returns:
         bool: True if the request was successful, False otherwise.
     """
-    with requests.Session() as session:
+    with SyncClientSession() as session:
         try:
             response = session.post(url, json=payload, timeout=10)
             response.raise_for_status()  # Raises exception for 4xx/5xx responses
 
@@ -4,9 +4,9 @@
 
 import os
 import json
-import aiohttp
-from aiohttp_retry import RetryClient, ExponentialRetry
-
+from aiohttp import ClientError
+from aiohttp_retry import RetryClient, FibonacciRetry
+from runpod.http_client import ClientSession
 from runpod.serverless.modules.rp_logger import RunPodLogger
 from .worker_state import Jobs, WORKER_ID
 
@@ -20,11 +20,11 @@
 job_list = Jobs()
 
 
-async def _transmit(client_session, url, job_data):
+async def _transmit(client_session: ClientSession, url, job_data):
     """
     Wrapper for transmitting results via POST.
     """
-    retry_options = ExponentialRetry(attempts=3)
+    retry_options = FibonacciRetry(attempts=3)
     retry_client = RetryClient(client_session=client_session, retry_options=retry_options)
 
     kwargs = {
@@ -37,11 +37,14 @@ async def _transmit(client_session, url, job_data):
         await client_response.text()
 
 
-async def _handle_result(session, job_data, job, url_template, log_message, is_stream=False): # pylint: disable=too-many-arguments
+# pylint: disable=too-many-arguments, disable=line-too-long
+async def _handle_result(session: ClientSession, job_data, job, url_template, log_message, is_stream=False):
     """
     A helper function to handle the result, either for sending or streaming.
     """
     try:
+        session.headers["X-Request-ID"] = job["id"]
+
         serialized_job_data = json.dumps(job_data, ensure_ascii=False)
 
         is_stream = "true" if is_stream else "false"
@@ -50,7 +53,7 @@ async def _handle_result(session, job_data, job, url_template, log_message, is_s
         await _transmit(session, url, serialized_job_data)
         log.debug(f"{log_message}", job['id'])
 
-    except aiohttp.ClientError as err:
+    except ClientError as err:
         log.error(f"Failed to return job results. | {err}", job['id'])
 
     except (TypeError, RuntimeError) as err:
 
@@ -10,8 +10,8 @@
 import json
 import asyncio
 import traceback
-from aiohttp import ClientSession
 
+from runpod.http_client import ClientSession
 from runpod.serverless.modules.rp_logger import RunPodLogger
 from .worker_state import WORKER_ID, Jobs
 from .rp_tips import check_return_size
@@ -43,10 +43,8 @@ async def get_job(session: ClientSession, retry=True) -> Optional[Dict[str, Any]
     Will continue trying to get a job until one is available.
 
     Args:
-        session (ClientSession): The aiohttp ClientSession to use for the request.
+        session (ClientSession): The async http client to use for the request.
         retry (bool): Whether to retry if no job is available.
-
-    Note: Retry True just for ease of, if testing improved this can be removed.
     """
     next_job = None
 
@@ -106,7 +104,7 @@ async def get_job(session: ClientSession, retry=True) -> Optional[Dict[str, Any]
             if retry is False:
                 break
 
-        await asyncio.sleep(0)
+        await asyncio.sleep(1)
     else:
         job_list.add_job(next_job["id"])
         log.debug("Request ID added.", next_job['id'])
 
@@ -16,7 +16,7 @@
 
 
 MAX_MESSAGE_LENGTH = 4096
-LOG_LEVELS = ['NOTSET', 'DEBUG', 'INFO', 'WARN', 'ERROR']
+LOG_LEVELS = ['NOTSET', 'DEBUG', 'TRACE', 'INFO', 'WARN', 'ERROR']
 
 
 def _validate_log_level(log_level):
@@ -32,7 +32,7 @@ def _validate_log_level(log_level):
         return log_level
 
     if isinstance(log_level, int):
-        if log_level < 0 or log_level > 4:
+        if log_level < 0 or log_level >= len(LOG_LEVELS):
             raise ValueError(f'Invalid debug level: {log_level}')
 
         return LOG_LEVELS[log_level]
@@ -134,3 +134,9 @@ def tip(self, message):
         tip log
         '''
         self.log(message, 'TIP')
+
+    def trace(self, message, request_id: Optional[str] = None):
+        '''Log `message` at TRACE level (buffered until flushed), tagged with request_id.'''
+        # Delegates to the generic log() entry point like the other level helpers
+        level = 'TRACE'
+        self.log(message, level, request_id)