Add support for ReductStore API v1.7 #95

Merged · 7 commits · Oct 2, 2023
5 changes: 5 additions & 0 deletions CHANGELOG.md
@@ -7,6 +7,11 @@ and this project adheres to [Semantic Versioning](https://semver.org/spec/v2.0.0

## [Unreleased]


### Added:

- Support for ReductStore HTTP API v1.7, see `Bucket.write_batch` method, [PR-95](https://github.com/reductstore/reduct-py/pull/95)

### Changed:

- Update dependencies and migrate to Pydantic v2, [PR-94](https://github.com/reductstore/reduct-py/pull/94)
4 changes: 2 additions & 2 deletions README.md
@@ -8,12 +8,12 @@ This package provides an asynchronous HTTP client for interacting with the [Redu

## Features

* Supports the [ReductStore HTTP API v1.6](https://docs.reduct.store/http-api)
* Supports the [ReductStore HTTP API v1.7](https://docs.reduct.store/http-api)
* Bucket management
* API Token management
* Write, read and query data
* Labels
* Batching records
* Batching records for read and write operations
* Subscription on new data

## Install
68 changes: 63 additions & 5 deletions reduct/bucket.py
@@ -9,12 +9,21 @@
List,
AsyncIterator,
Union,
Dict,
)

from pydantic import BaseModel

from reduct.error import ReductError
from reduct.http import HttpClient
from reduct.record import Record, parse_batched_records, parse_record
from reduct.record import (
Record,
parse_batched_records,
parse_record,
Batch,
TIME_PREFIX,
ERROR_PREFIX,
)


class QuotaType(Enum):
@@ -58,6 +67,9 @@ class BucketInfo(BaseModel):
latest_record: int
"""UNIX timestamp of the latest record in microseconds"""

is_provisioned: bool = False
"""bucket is provisioned amd you can't remove it or change its settings"""


class EntryInfo(BaseModel):
"""Entry of bucket"""
@@ -231,6 +243,53 @@ async def write(
**kwargs,
)

async def write_batch(
self, entry_name: str, batch: Batch
) -> Dict[int, ReductError]:
"""
Write a batch of records to an entry in a single request

Args:
entry_name: name of entry in the bucket
batch: batch of records to write
Returns:
dict of errors with timestamps as keys
Raises:
ReductError: if there is an HTTP or communication error
"""

record_headers = {}
content_length = 0
for time_stamp, record in batch.items():
content_length += record.size
header = f"{record.size},{record.content_type}"
for label, value in record.labels.items():
if "," in label or "=" in label:
header += f',{label}="{value}"'
else:
header += f",{label}={value}"

record_headers[f"{TIME_PREFIX}{time_stamp}"] = header

async def iter_body():
for _, rec in batch.items():
yield await rec.read_all()

_, headers = await self._http.request_all(
"POST",
f"/b/{self.name}/{entry_name}/batch",
data=iter_body(),
extra_headers=record_headers,
content_length=content_length,
)

errors = {}
for key, value in headers.items():
if key.startswith(ERROR_PREFIX):
errors[int(key[len(ERROR_PREFIX) :])] = ReductError.from_header(value)

return errors
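
For reviewers, a minimal usage sketch of the new `write_batch` API. The server URL, token, bucket and entry names are placeholders; `Batch` is imported from `reduct.record`, where this PR defines it (it may also be re-exported from the top-level package):

```python
import asyncio

from reduct import Client
from reduct.record import Batch  # defined in this PR; may also be re-exported as reduct.Batch


async def main():
    # Placeholder URL and API token for this sketch.
    client = Client("http://127.0.0.1:8383", api_token="my-token")
    bucket = await client.create_bucket("demo", exist_ok=True)

    batch = Batch()
    # Timestamps are UNIX microseconds; content_type and labels are optional.
    batch.add(1_000_000, b"first record", labels={"source": "sensor-1"})
    batch.add(2_000_000, b"second record", content_type="text/plain")

    # One HTTP request for the whole batch; per-record failures are returned
    # (not raised) as a dict keyed by timestamp.
    errors = await bucket.write_batch("entry-1", batch)
    for timestamp, err in errors.items():
        print(f"record {timestamp} was not written: {err}")


asyncio.run(main())
```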

async def query(
self,
entry_name: str,
@@ -290,9 +349,8 @@ async def get_full_info(self) -> BucketFullInfo:
"""
Get full information about bucket (settings, statistics, entries)
"""
return BucketFullInfo.parse_raw(
await self._http.request_all("GET", f"/b/{self.name}")
)
body, _ = await self._http.request_all("GET", f"/b/{self.name}")
return BucketFullInfo.model_validate_json(body)

async def subscribe(
self, entry_name: str, start: Optional[int] = None, poll_interval=1.0, **kwargs
@@ -368,7 +426,7 @@ async def _query(self, entry_name, start, stop, ttl, **kwargs):
params["limit"] = kwargs["limit"]

url = f"/b/{self.name}/{entry_name}"
data = await self._http.request_all(
data, _ = await self._http.request_all(
"GET",
f"{url}/q",
params=params,
35 changes: 18 additions & 17 deletions reduct/client.py
@@ -70,6 +70,9 @@ class Token(BaseModel):
created_at: datetime
"""creation time of token"""

is_provisioned: bool = False
"""token is provisioned and can't be deleted or changed"""


class FullTokenInfo(Token):
"""Full information about token with permissions"""
@@ -137,7 +140,8 @@ async def info(self) -> ServerInfo:
Raises:
ReductError: if there is an HTTP error
"""
return ServerInfo.parse_raw(await self._http.request_all("GET", "/info"))
body, _ = await self._http.request_all("GET", "/info")
return ServerInfo.model_validate_json(body)

async def list(self) -> List[BucketInfo]:
"""
@@ -148,9 +152,8 @@ async def list(self) -> List[BucketInfo]:
Raises:
ReductError: if there is an HTTP error
"""
return BucketList.parse_raw(
await self._http.request_all("GET", "/list")
).buckets
body, _ = await self._http.request_all("GET", "/list")
return BucketList.model_validate_json(body).buckets

async def get_bucket(self, name: str) -> Bucket:
"""
@@ -184,7 +187,7 @@ async def create_bucket(
Raises:
ReductError: if there is an HTTP error
"""
data = settings.json() if settings else None
data = settings.model_dump_json() if settings else None
try:
await self._http.request_all("POST", f"/b/{name}", data=data)
except ReductError as err:
@@ -201,9 +204,8 @@ async def get_token_list(self) -> List[Token]:
Raises:
ReductError: if there is an HTTP error
"""
return TokenList.parse_raw(
await self._http.request_all("GET", "/tokens")
).tokens
body, _ = await self._http.request_all("GET", "/tokens")
return TokenList.model_validate_json(body).tokens

async def get_token(self, name: str) -> FullTokenInfo:
"""
@@ -215,9 +217,8 @@ async def get_token(self, name: str) -> FullTokenInfo:
Raises:
ReductError: if there is an HTTP error
"""
return FullTokenInfo.parse_raw(
await self._http.request_all("GET", f"/tokens/{name}")
)
body, _ = await self._http.request_all("GET", f"/tokens/{name}")
return FullTokenInfo.model_validate_json(body)

async def create_token(self, name: str, permissions: Permissions) -> str:
"""
@@ -230,11 +231,10 @@ async def create_token(self, name: str, permissions: Permissions) -> str:
Raises:
ReductError: if there is an HTTP error
"""
return TokenCreateResponse.parse_raw(
await self._http.request_all(
"POST", f"/tokens/{name}", data=permissions.json()
)
).value
body, _ = await self._http.request_all(
"POST", f"/tokens/{name}", data=permissions.model_dump_json()
)
return TokenCreateResponse.model_validate_json(body).value

async def remove_token(self, name: str) -> None:
"""
@@ -254,4 +254,5 @@ async def me(self) -> FullTokenInfo:
Raises:
ReductError: if there is an HTTP error
"""
return FullTokenInfo.parse_raw(await self._http.request_all("GET", "/me"))
body, _ = await self._http.request_all("GET", "/me")
return FullTokenInfo.model_validate_json(body)
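
A short sketch of how a caller might use the new `is_provisioned` flag on tokens (URL and API token are placeholders):

```python
from reduct import Client


async def show_tokens() -> None:
    # Placeholder URL and API token for this sketch.
    client = Client("http://127.0.0.1:8383", api_token="my-token")
    for token in await client.get_token_list():
        if token.is_provisioned:
            # Provisioned tokens come from the server configuration and
            # cannot be removed or changed via the API.
            print(f"{token.name}: provisioned")
        else:
            print(f"{token.name}: created at {token.created_at}")
```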
11 changes: 11 additions & 0 deletions reduct/error.py
@@ -9,6 +9,14 @@ def __init__(self, code: int, message: str):
self._message = message
super().__init__(f"Status {self._code}: {self.message}")

@staticmethod
def from_header(header: str) -> "ReductError":
"""Create ReductError from HTTP header
with status code and message (batched write
)"""
status_code, message = header.split(",", 1)
return ReductError(int(status_code), message)

@property
def status_code(self):
"""Return HTTP status code"""
@@ -18,3 +26,6 @@ def status_code(self):
def message(self):
"""Return error message"""
return self._message

def __eq__(self, other: "ReductError"):
return self._code == other._code and self._message == other._message
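
A quick sketch of the new `from_header` helper and the equality check, based on the `"<status_code>,<message>"` header format used for batched-write errors; the example values are made up:

```python
from reduct.error import ReductError

# The header value is "<status_code>,<message>", as returned by the server
# for each record that could not be written in a batched request.
err = ReductError.from_header("404,Entry not found")
assert err.status_code == 404
assert err.message == "Entry not found"

# __eq__ compares status code and message, which makes errors easy to compare in tests.
assert err == ReductError(404, "Entry not found")
```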
24 changes: 20 additions & 4 deletions reduct/http.py
@@ -42,7 +42,7 @@ async def request(
) -> AsyncIterator[ClientResponse]:
"""HTTP request with ReductError exception"""

extra_headers = {}
extra_headers = kwargs.pop("extra_headers", {})
expect100 = False

if "content_length" in kwargs:
@@ -112,10 +112,26 @@ async def _request(
599, f"Connection failed, server {self._url} cannot be reached"
) from None

async def request_all(self, method: str, path: str = "", **kwargs) -> bytes:
"""Http request"""
async def request_all(
self, method: str, path: str = "", **kwargs
) -> (bytes, Dict[str, str]):
"""Http request
Args:
method (str): HTTP method
path (str, optional): Path. Defaults to "".
**kwargs: kwargs for aiohttp.request
Kwargs:
data (bytes | AsyncIterator[bytes]): request body
extra_headers (Dict[str, str]): extra headers
content_length (int): content length
Returns:
bytes: response body
Dict[str, str]: response headers
Raises:
ReductError: if request failed
"""
async with self.request(method, path, **kwargs) as response:
return await response.read()
return await response.read(), response.headers
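
A small sketch of the updated calling convention for `request_all`, which now returns the response headers alongside the body (the wrapper function below is illustrative, not part of the library):

```python
from typing import Dict, Tuple

from reduct.http import HttpClient


async def fetch_server_info(http: HttpClient) -> Tuple[bytes, Dict[str, str]]:
    # Callers now unpack a (body, headers) tuple instead of receiving bare bytes.
    body, headers = await http.request_all("GET", "/info")
    return body, headers
```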

async def request_chunked(
self, method: str, path: str = "", chunk_size=1024, **kwargs
58 changes: 53 additions & 5 deletions reduct/record.py
@@ -2,7 +2,7 @@
import asyncio
from dataclasses import dataclass
from functools import partial
from typing import Dict, Callable, AsyncIterator, Awaitable
from typing import Dict, Callable, AsyncIterator, Awaitable, Optional, List, Tuple

from aiohttp import ClientResponse

@@ -28,7 +28,57 @@ class Record:
"""labels of record"""


class Batch:
"""Batch of records to write them in one request"""

def __init__(self):
self._records: Dict[int, Record] = {}

def add(
self,
timestamp: int,
data: bytes,
content_type: Optional[str] = None,
labels: Optional[Dict[str, str]] = None,
):
"""Add record to batch
Args:
timestamp: UNIX timestamp in microseconds
data: data to store
content_type: content type of data (default: application/octet-stream)
labels: labels of record (default: {})
"""
if content_type is None:
content_type = "application/octet-stream"
if labels is None:
labels = {}

def read(n: int) -> AsyncIterator[bytes]:
raise NotImplementedError()

async def read_all():
return data

record = Record(
timestamp=timestamp,
size=len(data),
content_type=content_type,
labels=labels,
read_all=read_all,
read=read,
last=False,
)

self._records[timestamp] = record

def items(self) -> List[Tuple[int, Record]]:
"""Get records as dict items"""
return sorted(self._records.items())
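
A tiny sketch showing that `Batch` keeps records ordered by timestamp regardless of insertion order (the values are arbitrary):

```python
from reduct.record import Batch

batch = Batch()
batch.add(2_000_000, b"later")
batch.add(1_000_000, b"earlier")

# items() returns (timestamp, Record) tuples sorted by timestamp.
timestamps = [ts for ts, _ in batch.items()]
assert timestamps == [1_000_000, 2_000_000]
```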


LABEL_PREFIX = "x-reduct-label-"
TIME_PREFIX = "x-reduct-time-"
ERROR_PREFIX = "x-reduct-error-"
CHUNK_SIZE = 512_000


@@ -109,14 +159,12 @@ async def _read_all(buffer):
async def parse_batched_records(resp: ClientResponse) -> AsyncIterator[Record]:
"""Parse batched records from response"""

records_total = sum(
1 for header in resp.headers if header.startswith("x-reduct-time-")
)
records_total = sum(1 for header in resp.headers if header.startswith(TIME_PREFIX))
records_count = 0
head = resp.method == "HEAD"

for name, value in resp.headers.items():
if name.startswith("x-reduct-time-"):
if name.startswith(TIME_PREFIX):
timestamp = int(name[len(TIME_PREFIX) :])
content_length, content_type, labels = _parse_header_as_csv_row(value)
