From e79d0bcb2d257b4f27bd0eb32ccb6c30c4c4d810 Mon Sep 17 00:00:00 2001 From: alex Date: Mon, 2 Dec 2024 18:02:13 +0100 Subject: [PATCH 1/4] Changes: - split up connections and transactions - update docs --- docs/connections-and-transactions.md | 381 ++++----------------------- docs/database.md | 275 +++++++++++++++++++ docs/databasez-people.md | 8 +- docs/extra-drivers-and-overwrites.md | 90 +++++++ docs/integrations.md | 46 +++- mkdocs.yml | 2 + 6 files changed, 454 insertions(+), 348 deletions(-) create mode 100644 docs/database.md create mode 100644 docs/extra-drivers-and-overwrites.md diff --git a/docs/connections-and-transactions.md b/docs/connections-and-transactions.md index 2c2620d..6ad9756 100644 --- a/docs/connections-and-transactions.md +++ b/docs/connections-and-transactions.md @@ -1,340 +1,81 @@ # Connections and Transactions -Databasez handles database connection pooling and transaction management -with minimal fuss. It'll automatically deal with acquiring and releasing -connections to the pool as needed, and supports a simple transaction API -that transparently handles the use of either transactions or savepoints. +## Connections -## Database +Connections are the heart-piece of databasez. They are enabling rollback behavior, via transactions +and provide all manipulation functions. +Despite there are shortcut methods on the [Database object](./database.md), they are all using +connections internally. +When wanting for performance reasons one connection doing multiple jobs, retrieving a connection via +`connection()` and perform all tasks within the connection context (connections are async contextmanagers) are the way to go. -This is the main object used for the connections and it is a very powerful object. +### Multithreading -```python -from databasez import Database -``` - -**Parameters** - -* **url** - The `url` of the connection string or a Database object to copy from. - - Default: `None` - -* **force_rollback** - An optional boolean flag for force_rollback. Overwritable at runtime possible. - Note: when None it copies the value from the provided Database object or sets it to False. - - Default: `None` - -* **full_isolation** - Special mode for using force_rollback with nested queries. This parameter fully isolates the global connection - in an extra thread. This way it is possible to use blocking operations like locks with force_rollback. - This parameter has no use when used without force_rollback and causes a slightly slower setup (Lock is initialized). - It is required for edgy or other frameworks which use threads in tests and the force_rollback parameter. - - Default: `None` +`sqlalchemy`'s async addon is also multi-threading capable but we cannot use this for two reasons: -* **poll_interval** - When using multithreading, the poll_interval is used to retrieve results from other loops. It defaults to a sane value. +- Only the `NullPool` is supported which is afaik just no pooling. +- No global connection which is reliable resetted would be possible. - Default: `None` +Therefor `databasez` uses an other approach: `isolation`: -* **config** - A python like dictionary as alternative to the `url` that contains the information -to connect to the database. +Event-loops are per thread. So in this approach for every new event-loop detected the database object is copied and assigned to it. +This way all connections are running in a per-thread pool. The global connection is a bit different from the rest. +Whenever it is accessed by an other thread, asyncio.run_coroutine_threadsafe is used. +In the full-isolation mode (default) the global connection is even moved to an own thread. - Default: `None` +### Self-resetting global connection -* **options** - Any other configuration. The classic `kwargs`. +Sometimes, especially for tests, you want a connection in which all changes are resetted when the database is closed. +For having this reliable, a global connection is lazily initialized when requested on the database object via the +`force_rollback` contextmanager/parameter/pseudo-attribute. -!!! Warning - Be careful when setting up the `url` or `config`. You can use one or the other but not both - at the same time. +Whenever `connection()` is called, the same global connection is returned. It behaves nearly normally except you have just one connection +available. +This means you have to be careful when using `iterate` to not open another connection via `connection` (except you set `force_rollback` to False before opening the connection). +Otherwise it will deadlock. -!!! Warning - `full_isolation` is not mature and shouldn't be used in production code. +## Transactions -**Attributes*** +Transactions are lazily initialized. You dont't need a connected database to create them via `database.transaction()`. -* **force_rollback**: - It evaluates its trueness value to the active value of force_rollback for this context. - You can delete it to reset it (`del database.force_rollback`) (it uses the descriptor magic). +When created, there are three ways to activate the Transaction -**Functions** +1. The async context manager way via `async with transaction: ...` +2. Entering a method decorated with a transaction. +3. The manual way via `await transaction` -* **__copy__** - Either usable directly or via copy from the copy module. A fresh Database object with the same options as the existing is created. - Note: for creating a copy with overwritten initial force_rollback you can use: `Database(database_obj, force_rollback=False)`. - Note: you have to connect it. +Whenever the transaction is activated, a connected database is required. -* **force_rollback(force_rollback=True)**: - The magic attribute is also function returning a context-manager for temporary overwrites of force_rollback. +A second way to get a transaction is via the `Connection`. It has also a `transaction()` method. -* **asgi** - ASGI lifespan interception shim. -## Connecting and disconnecting +### The three ways to use a transaction -You can control the database connection, by using it as a async context manager. +#### Via the async context manager protocol ```python -async with Database(DATABASE_URL) as database: +async with database.transaction(): ... ``` - -Or by using explicit `.connect()` and `disconnect()`: - -```python -database = Database(DATABASE_URL) - -await database.connect() -... -await database.disconnect() -``` - -If you're integrating against a web framework, then you'll probably want -to hook into framework startup or shutdown events. For example, with -[Esmerald][esmerald] you would use the following: - -```python -@app.on_event("startup") -async def startup(): - await database.connect() - -@app.on_event("shutdown") -async def shutdown(): - await database.disconnect() -``` - -Starlette is deprecating the previous way of declaring events in favour of the newly created -`Lifespan`. - -[Esmerald][esmerald] on the other hand, will allow you to continue to use the events in both ways. -Internally Esmerald handles the `on_startup` and `on_shutdown` in a unique and clean way where -it will automatically generate the `Lifespan` events for you. - -!!! Note - Since the author of [Esmerald][esmerald] and [Edgy][edgy] is the same and you would like to - have those same type of events to continue also for Starlette even after the deprecation and without - breaking your code or diverge from Starlette's base, the same author is the creator of - [Starlette Bridge][starlette-bridge] where it was shared the same approach created for Esmerald with - everyone to use with Starlette or any Starlette related project, for example, FastAPI. - - -## Connection options as a string - -The PostgreSQL and MySQL backends provide a few connection options for SSL -and for configuring the connection pool. - -```python -# Use an SSL connection. -database = Database('postgresql+asyncpg://localhost/example?ssl=true') - -# Use an SSL connection and configure pool -database = Database('postgresql+asyncpg://localhost/example?ssl=true&pool_size=20') -``` - -You can also use keyword arguments to pass in any connection options. -Available keyword arguments may differ between database backends. Keywords can be used like in create_async_engine (most are passed through). -This means also the keyword extraction works like in sqlalchemy - -```python -database = Database('postgresql+asyncpg://localhost/example', ssl=True, pool_size=20) -``` - -Note: not all query values are morphed into kwargs arguments. -Options which will be transformed are in `databasez/sqlalchemy.py` in `extract_options` - -Some transformed options are: - -- ssl: enable ssl. -- echo: enable echo. -- echo_pool: enable echo for pool. -- pool_size: maximal amount of connections, int (former name: min_size). -- max_overflow: maximal amount of connections, int (former name: max_size). -- pool_recycle: maximal duration a connection may live, float. -- isolation_level: isolation_level, str. - - -## Connection options as a dictionary - -**Databasez** also provides another way of passing the connection options by using dictionaries. - -For those who are used to other frameworks handling the connections in this way, this was also a -reason why this was also added. - -Databasez expects a python dictionary like object with the following structure. - -```python - -"connection": { - "credentials": { - "scheme": 'sqlite', "postgres" ... - "host": ..., - "port": ..., - "user": ..., - "password": ..., - "database": ..., - "options": { # only query - "driver": ... # In case of MSSQL - "ssl": ... - } - } -} -``` - -When a python dictionary like is passed into the `Database` object, then the `config` parameter -needs to be set. - -```python -from databasez import Database - -CONFIG = { - "connection": { - "credentials": { - "scheme": 'sqlite', "postgres" ... - "host": ..., - "port": ..., - "user": ..., - "password": ..., - "database": ..., - "options": { - "driver": ... # In case of MSSQL - "ssl": ... - } - } - } -} - -database = Database(config=CONFIG) -``` - -The `options` **is everything else that should go in the query parameters, meaning, after the `?`** - -### Normal cases - -Let us see an example. Let us assume we have a database with the following: - -* Type: `postgres` -* Database name: `my_db` -* User: `postgres` -* Password: `password` -* Port: `5432` -* Host: `localhost` - -This would look like this: - -```python -{! ../docs_src/connections/as_dict.py!} -``` - -This is the equivalent to: - -```shell -postgresql+asyncpg://postgres:password@localhost:5432/my_db -``` - -### A more complex example - -Let us now use an example using `MSSQL` which usually requires more options to be passed. - -* Type: `mssql` -* Database name: `master` -* User: `sa` -* Password: `Mssql123mssql-` -* Port: `1433` -* Host: `localhost` - -This would look like this: +It can also be acquired from a specific database connection: ```python -{! ../docs_src/connections/mssql.py!} -``` - -This is the equivalent to: - -```shell -mssql+aioodbc://sa:Mssql123mssql-@localhost:1433/master?driver=ODBC+Driver+17+for+SQL+Server +async with database.connection() as connection: + async with connection.transaction(): + ... ``` -!!! Note - As you can see, Databasez offers some other ways of achieving the same results and offers - multiple forms of creating a [Database](#database) object. - -## JDBC - -Databasez injects a jdbc driver. You can use it as simple as: - -`jdbc+jdbc-dsn-driver-name://dsn?jdbc_driver=?` - -or for modern jdbc drivers - -`jdbc+jdbc-dsn-driver-name://dsn` - -Despite the jdbc-dsn-driver-name is not known by sqlalchemy this works. The overwrites rewrite the URL for sqlalchemy. - - -!!! Warning - It seems like injecting classpathes in a running JVM doesn't work properly. If you have more then one jdbc driver, - make sure all classpathes are specified. - - -!!! Warning - The jdbc driver doesn't support setting the isolation_level yet (this is highly db vendor specific). - -### Parameters - -The jdbc driver supports some extra parameters which will be removed from the query (note: most of them can be also passed via keywords) - -* **jdbc_driver** - import path of the jdbc driver (java format). Required for old jdbc drivers. -* **jdbc_driver_args** - additional keyword arguments for the driver. Note: they must be passed in json format. Query only parameter. -* **jdbc_dsn_driver** - Not really required because of the rewrite but if the url only specifies jdbc:// withouth the dsn driver you can set it here manually. - -### Direct-only parameters - -These parameters are directly set in database as keywords and have no DSN conversion. - -* **transform_reflected_names** - Because JDBC drivers (especially old) do strange name mangling we may need this parameter. - It has 3 possible values: "upper", "lower", "none" (default). When upper or lower is used, all names are converted in this case. - This is required for ancient sqlite jdbc drivers. -* **use_code_datatype** - When True the java code type is evaluated instead of parsing the SQL string datatype. By default False. - -## dbapi2 - - -Databasez injects a dbapi2 driver. You can use it as simple as: - -`dbapi2+foo://dsn` - -or simply - -`dbapi2://dsn` - -!!! Warning - The dbapi2 driver doesn't support setting the isolation_level yet (this is highly db vendor specific). - -### Parameters - -The dbapi2 driver supports some extra parameters which will be removed from the query (note: most of them can be also passed via keywords) - -* **dbapi_driver_args** - additional keyword arguments for the driver. Note: they must be passed in json format. Query only parameter. -* **dbapi_dsn_driver** - If required it is possible to set the dsn driver here. Normally it should work without. You can use the same trick like in jdbc to provide a dsn driver. -* **dbapi_pool** - thread/process. Default: thread. How the dbapi2. is isolated. Either via ProcessPool or ThreadPool (with one worker). -* **dbapi_force_async_wrapper** - bool/None. Default: None. Figure out if the async_wrapper is required. By setting a bool the wrapper can be enforced or removed. +#### Via decorating -The dbapi2 has some extra options which cannot be passed via the url, some of them are required: - -* **dbapi_path** - Import path of the dbapi2 module. Required - -## Transactions - -Transactions are managed by async context blocks. - -A transaction can be acquired from the database connection pool: +You can also use `.transaction()` as a function decorator on any async function: ```python -async with database.transaction(): +@database.transaction() +async def create_users(request): ... ``` -It can also be acquired from a specific database connection: -```python -async with database.connection() as connection: - async with connection.transaction(): - ... -``` +#### Manually For a lower-level transaction API: @@ -348,13 +89,7 @@ else: await transaction.commit() ``` -You can also use `.transaction()` as a function decorator on any async function: - -```python -@database.transaction() -async def create_users(request): - ... -``` +### Advanced operations The state of a transaction is liked to the connection used in the currently executing async task. If you would like to influence an active transaction from another task, the connection must be @@ -408,29 +143,3 @@ async with databases.Database(database_url) as db: async with database.transaction(isolation_level="serializable"): ... ``` - -## Reusing sqlalchemy engine of databasez - -For integration in other libraries databasez has also the AsyncEngine exposed via the `engine` property. -If a database is connected you can retrieve the engine from there. - -## Debugging (multithreading) - -Sometimes there is a lockup. To get of the underlying issues, you can set - -`databasez.utils.DATABASEZ_RESULT_TIMEOUT` to a positive float/int value. - -This way lockups will raise an exception. - - -## Special jdbc/dbapi2 stuff - -Currently there is not much documentation and you have to check the overwrites and dialects yourself to get an idea how it works. -Additional there is a jdbc test with a really old sqlite jdbc jar so you may get an idea how it works. - -However it is planned to update the documentation. - -[esmerald]: https://github.com/dymmond/esmerald -[edgy]: https://github.com/dymmond/edgy -[saffier]: https://github.com/tarsil/saffier -[starlette-bridge]: https://github.com/tarsil/starlette-bridge diff --git a/docs/database.md b/docs/database.md new file mode 100644 index 0000000..9b33d46 --- /dev/null +++ b/docs/database.md @@ -0,0 +1,275 @@ +# Connection and Database + +Databasez handles database connection pooling and transaction management +with minimal fuss. It'll automatically deal with acquiring and releasing +connections to the pool as needed, and supports a simple transaction API +that transparently handles the use of either transactions or savepoints. + +## Database + +This is the main object used for the connections and it is a very powerful object. + +```python +from databasez import Database +``` + +**Parameters** + +* **url** - The `url` of the connection string or a Database object to copy from. + + Default: `None` + +* **force_rollback** - An optional boolean flag for force_rollback. Overwritable at runtime possible. + Note: when None it copies the value from the provided Database object or sets it to False. + + Default: `None` + +* **full_isolation** - Special mode for using force_rollback with nested queries. This parameter fully isolates the global connection + in an extra thread. This way it is possible to use blocking operations like locks with force_rollback. + This parameter has no use when used without force_rollback and causes a slightly slower setup (Lock is initialized). + It is required for edgy or other frameworks which use threads in tests and the force_rollback parameter. + + Default: `None` + +* **poll_interval** - When using multithreading, the poll_interval is used to retrieve results from other loops. It defaults to a sane value. + + Default: `None` + +* **config** - A python like dictionary as alternative to the `url` that contains the information +to connect to the database. + + Default: `None` + +* **options** - Any other configuration. The classic `kwargs`. + +!!! Warning + Be careful when setting up the `url` or `config`. You can use one or the other but not both + at the same time. + +!!! Warning + `full_isolation` is not mature and shouldn't be used in production code. + +**Attributes*** + +* **force_rollback**: + It evaluates its trueness value to the active value of force_rollback for this context. + You can delete it to reset it (`del database.force_rollback`) (it uses the descriptor magic). + +**Functions** + +* **__copy__** - Either usable directly or via copy from the copy module. A fresh Database object with the same options as the existing is created. + Note: for creating a copy with overwritten initial force_rollback you can use: `Database(database_obj, force_rollback=False)`. + Note: you have to connect it. + +* **force_rollback(force_rollback=True)**: - The magic attribute is also function returning a context-manager for temporary overwrites of force_rollback. + +* **asgi** - ASGI lifespan interception shim. + +## Connecting and disconnecting + +You can control the database connection, by using it as a async context manager. + +```python +async with Database(DATABASE_URL) as database: + ... +``` + +Or by using explicit `.connect()` and `disconnect()`: + +```python +database = Database(DATABASE_URL) + +await database.connect() +... +await database.disconnect() +``` + +If you're integrating against a web framework, then you'll probably want +to hook into framework startup or shutdown events. For example, with +[Esmerald][esmerald] you could use the following: + +```python +{!> ../docs_src/integrations/django.py !} +``` + +In django/ +## Connection options as a string + +The PostgreSQL and MySQL backends provide a few connection options for SSL +and for configuring the connection pool. + +```python +# Use an SSL connection. +database = Database('postgresql+asyncpg://localhost/example?ssl=true') + +# Use an SSL connection and configure pool +database = Database('postgresql+asyncpg://localhost/example?ssl=true&pool_size=20') +``` + +You can also use keyword arguments to pass in any connection options. +Available keyword arguments may differ between database backends. Keywords can be used like in create_async_engine (most are passed through). +This means also the keyword extraction works like in sqlalchemy + +```python +database = Database('postgresql+asyncpg://localhost/example', ssl=True, pool_size=20) +``` + +Note: not all query values are morphed into kwargs arguments. +Options which will be transformed are in `databasez/sqlalchemy.py` in `extract_options` + +Some transformed options are: + +- ssl: enable ssl. +- echo: enable echo. +- echo_pool: enable echo for pool. +- pool_size: maximal amount of connections, int (former name: min_size). +- max_overflow: maximal amount of connections, int (former name: max_size). +- pool_recycle: maximal duration a connection may live, float. +- isolation_level: isolation_level, str. + + +## Connection options as a dictionary + +**Databasez** also provides another way of passing the connection options by using dictionaries. + +For those who are used to other frameworks handling the connections in this way, this was also a +reason why this was also added. + +Databasez expects a python dictionary like object with the following structure. + +```python + +"connection": { + "credentials": { + "scheme": 'sqlite', "postgres" ... + "host": ..., + "port": ..., + "user": ..., + "password": ..., + "database": ..., + "options": { # only query + "driver": ... # In case of MSSQL + "ssl": ... + } + } +} +``` + +When a python dictionary like is passed into the `Database` object, then the `config` parameter +needs to be set. + +```python +from databasez import Database + +CONFIG = { + "connection": { + "credentials": { + "scheme": 'sqlite', "postgres" ... + "host": ..., + "port": ..., + "user": ..., + "password": ..., + "database": ..., + "options": { + "driver": ... # In case of MSSQL + "ssl": ... + } + } + } +} + +database = Database(config=CONFIG) +``` + +The `options` **is everything else that should go in the query parameters, meaning, after the `?`** + +### Normal cases + +Let us see an example. Let us assume we have a database with the following: + +* Type: `postgres` +* Database name: `my_db` +* User: `postgres` +* Password: `password` +* Port: `5432` +* Host: `localhost` + +This would look like this: + +```python +{! ../docs_src/connections/as_dict.py!} +``` + +This is the equivalent to: + +```shell +postgresql+asyncpg://postgres:password@localhost:5432/my_db +``` + +### A more complex example + +Let us now use an example using `MSSQL` which usually requires more options to be passed. + +* Type: `mssql` +* Database name: `master` +* User: `sa` +* Password: `Mssql123mssql-` +* Port: `1433` +* Host: `localhost` + +This would look like this: + +```python +{! ../docs_src/connections/mssql.py!} +``` + +This is the equivalent to: + +```shell +mssql+aioodbc://sa:Mssql123mssql-@localhost:1433/master?driver=ODBC+Driver+17+for+SQL+Server +``` + +!!! Note + As you can see, Databasez offers some other ways of achieving the same results and offers + multiple forms of creating a [Database](#database) object. + + +## Extra drivers + +Databasez comes with extra drivers and overwrites for existing drivers. +That way some strange defaults of sqlalchemy are smoothed and the DSN analysed for extra parameters +which were keyword only in the original dialect. +This way an integration is easier. + +[Extra drivers and overwrites](./extra-drivers-and-overwrites.md) + +## Connections and Transactions + +Databasez uses enhanced connection objects. They smooth out some API decisions by the sqlalchemy authors +but allow direct access to the sqlalchemy connections too. +So both styles can be mixed. + +Most important is, only when using them as context, operations are guranteed async/multithreading capable when using databasez. + +Further documentation is in: + +[Connections & Transactions](./connections-and-transactions.md) + + +## Reusing sqlalchemy engine of databasez + +For integration in other libraries databasez has also the AsyncEngine exposed via the `engine` property. +If a database is connected you can retrieve the engine from there. +It is however protected, so you can only access it from the same loop. + +## Debugging (multithreading) + +Sometimes there is a lockup. To get of the underlying issues, you can set + +`databasez.utils.DATABASEZ_RESULT_TIMEOUT` to a positive float/int value. + +This way lockups will raise an exception. + +## Links + +[esmerald]: https://github.com/dymmond/esmerald diff --git a/docs/databasez-people.md b/docs/databasez-people.md index 8ba0855..c5fb273 100644 --- a/docs/databasez-people.md +++ b/docs/databasez-people.md @@ -1,9 +1,7 @@ # Databasez People -## The Special Ones +Databasez wouldn't be possible in this way without these people. -Currently there are no special ones but we are hoping this will change soon. +- @devkral (https://github.com/devkral) -## The Legends - -Currently there are no legends but we are hoping this will change soon. + He refactored databasez nearly completely and added JDBC support as well as the mixed async-multithreading support. diff --git a/docs/extra-drivers-and-overwrites.md b/docs/extra-drivers-and-overwrites.md new file mode 100644 index 0000000..0b96320 --- /dev/null +++ b/docs/extra-drivers-and-overwrites.md @@ -0,0 +1,90 @@ +# Extra drivers and overwrites + +## Extra drivers + +### JDBC + +Databasez injects a jdbc driver. You can use it as simple as: + +`jdbc+jdbc-dsn-driver-name://dsn?jdbc_driver=?` + +or for modern jdbc drivers + +`jdbc+jdbc-dsn-driver-name://dsn` + +Despite the jdbc-dsn-driver-name is not known by sqlalchemy this works. The overwrites rewrite the URL for sqlalchemy. + + +!!! Warning + It seems like injecting classpathes in a running JVM doesn't work properly. If you have more then one jdbc driver, + make sure all classpathes are specified. + + +!!! Warning + The jdbc driver doesn't support setting the isolation_level yet (this is highly db vendor specific). + +### Parameters + +The jdbc driver supports some extra parameters which will be removed from the query (note: most of them can be also passed via keywords) + +* **jdbc_driver** - import path of the jdbc driver (java format). Required for old jdbc drivers. +* **jdbc_driver_args** - additional keyword arguments for the driver. Note: they must be passed in json format. Query only parameter. +* **jdbc_dsn_driver** - Not really required because of the rewrite but if the url only specifies jdbc:// withouth the dsn driver you can set it here manually. + +### Direct-only parameters + +These parameters are directly set in database as keywords and have no DSN conversion. + +* **transform_reflected_names** - Because JDBC drivers (especially old) do strange name mangling we may need this parameter. + It has 3 possible values: "upper", "lower", "none" (default). When upper or lower is used, all names are converted in this case. + This is required for ancient sqlite jdbc drivers. +* **use_code_datatype** - When True the java code type is evaluated instead of parsing the SQL string datatype. By default False. + +### dbapi2 + + +Databasez injects a dbapi2 driver. You can use it as simple as: + +`dbapi2+foo://dsn` + +or simply + +`dbapi2://dsn` + +!!! Warning + The dbapi2 driver doesn't support setting the isolation_level yet (this is highly db vendor specific). + +### Parameters + +The dbapi2 driver supports some extra parameters which will be removed from the query (note: most of them can be also passed via keywords) + +* **dbapi_driver_args** - additional keyword arguments for the driver. Note: they must be passed in json format. Query only parameter. +* **dbapi_dsn_driver** - If required it is possible to set the dsn driver here. Normally it should work without. You can use the same trick like in jdbc to provide a dsn driver. +* **dbapi_pool** - thread/process. Default: thread. How the dbapi2. is isolated. Either via ProcessPool or ThreadPool (with one worker). +* **dbapi_force_async_wrapper** - bool/None. Default: None. Figure out if the async_wrapper is required. By setting a bool the wrapper can be enforced or removed. + +The dbapi2 has some extra options which cannot be passed via the url, some of them are required: + +* **dbapi_path** - Import path of the dbapi2 module. Required + +## Overwrites + +Overwrites can improve existing dialects or coexist with extra drivers to add some tricks. +For example dialects having a json_serializer/json_deserializer parameter, have it set to orjson for more performance. + +Overwrites can consist of three components, which must be classes of the name in a module: + +- Database +- Connection +- Transaction + +All of them are independent by default and must inherite from: + +- DatabaseBackend +- ConnectionBackend +- TransactionBackend + +For simplification there are full functional implementations in `databasez.sqlalchemy`. +It is recommended to inherit from there and just adjust the behavior. + +You can have a look in `databasez/overwrites` for examples. diff --git a/docs/integrations.md b/docs/integrations.md index cbc60d6..cd25cde 100644 --- a/docs/integrations.md +++ b/docs/integrations.md @@ -1,12 +1,14 @@ # Integrations +## Application integration + Databasez has several ways to integrate in applications. Mainly recommended are the async contextmanager one and the asgi based. -## AsyncContextManager +### AsyncContextManager The recommended way of manually using databasez is via the async contextmanager protocol. -This way it is ensured that the database is tore down on errors. +This way it is ensured that the database is torn down on errors. Luckily starlette based apps support the lifespan protocol (startup, teardown of an ASGI server) via async contextmanagers. @@ -14,10 +16,11 @@ Luckily starlette based apps support the lifespan protocol (startup, teardown of {!> ../docs_src/integrations/starlette.py !} ``` -Note: This works also in different domains which are not web related. +!!! Note + This works also in different domains which are not web related. -## ASGI +### ASGI This is a lifespan protocol interception shim for ASGI lifespan. Instead of using the lifespan parameter of starlette, it is possible to wrap the ASGI application via the shim. This way databasez intercepts lifespans requests and injects its code. @@ -29,11 +32,40 @@ It is required for ASGI apps without lifespan support like django. {!> ../docs_src/integrations/django.py !} ``` -## Manually +### Manually -Some Server doesn't support the lifespan protocol. E.g. WSGI based servers. Here is an example how to integrate it. -As well as with the AsyncContextManager we are not limitted to web applications. +Some Server doesn't support the lifespan protocol. E.g. WSGI based servers. +As well as with the AsyncContextManager we are not limited to web applications. +For demonstration purposes we use here esmerald with `on_startup` and `on_shutdown` events. ```python {!> ../docs_src/integrations/esmerald.py !} ``` + +!!! Note + Starlette is deprecating the integration via events. + If you like this way and wants to keep it you may can switch to + [Esmerald][esmerald], which continues to support the old way of integration or + to use [Starlette Bridge][starlette-bridge] which enables such behavior and is from + the same author. + [Starlette Bridge][starlette-bridge] works for Starlette and + any Starlette related project, for example, FastAPI. + + +## ORMs + +There are at least two ORMs using databasez: + +- [Edgy][edgy] - A re-development of saffier using pydantic. It is very fast and has more features than saffier. + It is the recommended ORM. +- [Saffier][saffier] - A stable workhorse but most development will happen now in edgy. + +When using edgy, use the helpers of edgy instead of the ones of databasez for integrating in applications. +This way you get all features of edgy's `Registry`. + +## Links + +[edgy]: https://github.com/dymmond/edgy +[saffier]: https://github.com/tarsil/saffier +[esmerald]: https://github.com/dymmond/esmerald +[starlette-bridge]: https://github.com/tarsil/starlette-bridge diff --git a/mkdocs.yml b/mkdocs.yml index 83d00ed..27164f1 100644 --- a/mkdocs.yml +++ b/mkdocs.yml @@ -39,7 +39,9 @@ nav: - Databasez: "index.md" - Integrations: "integrations.md" - Queries: "queries.md" + - Database: "database.md" - Connections & Transactions: "connections-and-transactions.md" + - Extra drivers and overwrites: "extra-drivers-and-overwrites.md" - Test Client: "test-client.md" - Tests & Migrations: "tests-and-migrations.md" - Vendors: "vendors.md" From c742de38d2a94ca1bd07070680c643a09211f80f Mon Sep 17 00:00:00 2001 From: alex Date: Mon, 2 Dec 2024 18:29:35 +0100 Subject: [PATCH 2/4] Changes: - splitout examples in docs_src --- .gitignore | 1 + docs/connections-and-transactions.md | 75 +++++-------------- docs/database.md | 2 +- docs/release-notes.md | 2 +- .../transactions/async_context_connection.py | 12 +++ .../transactions/async_context_database.py | 12 +++ docs_src/transactions/decorating.py | 15 ++++ docs_src/transactions/isolation_level.py | 21 ++++++ docs_src/transactions/manually.py | 15 ++++ docs_src/transactions/nested_transactions.py | 20 +++++ 10 files changed, 117 insertions(+), 58 deletions(-) create mode 100644 docs_src/transactions/async_context_connection.py create mode 100644 docs_src/transactions/async_context_database.py create mode 100644 docs_src/transactions/decorating.py create mode 100644 docs_src/transactions/isolation_level.py create mode 100644 docs_src/transactions/manually.py create mode 100644 docs_src/transactions/nested_transactions.py diff --git a/.gitignore b/.gitignore index cc2b914..8d45587 100644 --- a/.gitignore +++ b/.gitignore @@ -12,3 +12,4 @@ venv/ .idea/ testsuite.sqlite3 test_testsuite.sqlite3 +site diff --git a/docs/connections-and-transactions.md b/docs/connections-and-transactions.md index 6ad9756..cac6620 100644 --- a/docs/connections-and-transactions.md +++ b/docs/connections-and-transactions.md @@ -23,7 +23,7 @@ This way all connections are running in a per-thread pool. The global connection Whenever it is accessed by an other thread, asyncio.run_coroutine_threadsafe is used. In the full-isolation mode (default) the global connection is even moved to an own thread. -### Self-resetting global connection +### Global connection with auto-rollback Sometimes, especially for tests, you want a connection in which all changes are resetted when the database is closed. For having this reliable, a global connection is lazily initialized when requested on the database object via the @@ -49,20 +49,26 @@ Whenever the transaction is activated, a connected database is required. A second way to get a transaction is via the `Connection`. It has also a `transaction()` method. +### Auto-rollback (`force_rollback`) + +Transactions support an keyword parameter named `force_rollback` which default to `False`. +When set to `True` at the end of the transaction a rollback is tried. +This means all changes are undone. + +This is a simpler variant of `force_rollback` of the database object. + + ### The three ways to use a transaction #### Via the async context manager protocol ```python -async with database.transaction(): - ... +{!> ../docs_src/transactions/async_context_database.py !} ``` It can also be acquired from a specific database connection: ```python -async with database.connection() as connection: - async with connection.transaction(): - ... +{!> ../docs_src/transactions/async_context_connection.py !} ``` #### Via decorating @@ -70,9 +76,7 @@ async with database.connection() as connection: You can also use `.transaction()` as a function decorator on any async function: ```python -@database.transaction() -async def create_users(request): - ... +{!> ../docs_src/transactions/decorating.py !} ``` #### Manually @@ -80,16 +84,10 @@ async def create_users(request): For a lower-level transaction API: ```python -transaction = await database.transaction() -try: - ... -except: - await transaction.rollback() -else: - await transaction.commit() +{!> ../docs_src/transactions/manually.py !} ``` -### Advanced operations +### Isolation level The state of a transaction is liked to the connection used in the currently executing async task. If you would like to influence an active transaction from another task, the connection must be @@ -98,48 +96,13 @@ shared: Transaction isolation-level can be specified if the driver backend supports that: ```python -async def add_excitement(connnection: databases.core.Connection, id: int): - await connection.execute( - "UPDATE notes SET text = CONCAT(text, '!!!') WHERE id = :id", - {"id": id} - ) - - -async with Database(database_url) as database: - async with database.transaction(): - # This note won't exist until the transaction closes... - await database.execute( - "INSERT INTO notes(id, text) values (1, 'databases is cool')" - ) - # ...but child tasks can use this connection now! - await asyncio.create_task(add_excitement(database.connection(), id=1)) - - await database.fetch_val("SELECT text FROM notes WHERE id=1") - # ^ returns: "databases is cool!!!" +{!> ../docs_src/transactions/isolation_level.py !} ``` -Nested transactions are fully supported, and are implemented using database savepoints: +### Nested transactions -```python -async with databases.Database(database_url) as db: - async with db.transaction() as outer: - # Do something in the outer transaction - ... - - # Suppress to prevent influence on the outer transaction - with contextlib.suppress(ValueError): - async with db.transaction(): - # Do something in the inner transaction - ... - - raise ValueError('Abort the inner transaction') - - # Observe the results of the outer transaction, - # without effects from the inner transaction. - await db.fetch_all('SELECT * FROM ...') -``` +Nested transactions are fully supported, and are implemented using database savepoints: ```python -async with database.transaction(isolation_level="serializable"): - ... +{!> ../docs_src/transactions/nested_transactions.py !} ``` diff --git a/docs/database.md b/docs/database.md index 9b33d46..2545382 100644 --- a/docs/database.md +++ b/docs/database.md @@ -1,4 +1,4 @@ -# Connection and Database +# Connecting to a database Databasez handles database connection pooling and transaction management with minimal fuss. It'll automatically deal with acquiring and releasing diff --git a/docs/release-notes.md b/docs/release-notes.md index 86f1ebd..745bd2c 100644 --- a/docs/release-notes.md +++ b/docs/release-notes.md @@ -319,5 +319,5 @@ forked from [Encode](https://github.com/encode/databases) with additional featur * SQLAlchemy 2+ integration. * Additonal support for `mssql`. -* [Connection as dict](./connections-and-transactions.md#connection-options-as-a-dictionary). +* [Connection as dict](./database.md#connection-options-as-a-dictionary). * Brings a native test client. diff --git a/docs_src/transactions/async_context_connection.py b/docs_src/transactions/async_context_connection.py new file mode 100644 index 0000000..8ccb39a --- /dev/null +++ b/docs_src/transactions/async_context_connection.py @@ -0,0 +1,12 @@ +from databasez import Database + + +async def main(): + async with Database("") as database, database.connection() as connection: + # do something + async with connection.transaction(): + ... + + # check something and then reset + async with connection.transaction(force_rollback=True): + ... diff --git a/docs_src/transactions/async_context_database.py b/docs_src/transactions/async_context_database.py new file mode 100644 index 0000000..8b24353 --- /dev/null +++ b/docs_src/transactions/async_context_database.py @@ -0,0 +1,12 @@ +from databasez import Database + + +async def main(): + async with Database("") as database: + # do something + async with database.transaction(): + ... + + # check something and then reset + async with database.transaction(force_rollback=True): + ... diff --git a/docs_src/transactions/decorating.py b/docs_src/transactions/decorating.py new file mode 100644 index 0000000..831c43c --- /dev/null +++ b/docs_src/transactions/decorating.py @@ -0,0 +1,15 @@ +from databasez import Database + +database = Database("") + + +@database.transaction() +async def create_users(request): + ... + # do something + + +async def main(): + async with database: + # now the transaction is activated + await create_users() diff --git a/docs_src/transactions/isolation_level.py b/docs_src/transactions/isolation_level.py new file mode 100644 index 0000000..47c21cb --- /dev/null +++ b/docs_src/transactions/isolation_level.py @@ -0,0 +1,21 @@ +import asyncio + +from databasez import Database, core + + +async def add_excitement(connection: core.Connection, id: int): + await connection.execute( + "UPDATE notes SET text = CONCAT(text, '!!!') WHERE id = :id", {"id": id} + ) + + +async with Database("database_url") as database: + async with database.transaction(): + # This note won't exist until the transaction closes... + await database.execute("INSERT INTO notes(id, text) values (1, 'databases is cool')") + # ...but child tasks can use this connection now! + await asyncio.create_task(add_excitement(database.connection(), id=1)) + + async with database.transaction(isolation_level="serializable"): + await database.fetch_val("SELECT text FROM notes WHERE id=1") + # ^ returns: "databases is cool!!!" diff --git a/docs_src/transactions/manually.py b/docs_src/transactions/manually.py new file mode 100644 index 0000000..2b4b817 --- /dev/null +++ b/docs_src/transactions/manually.py @@ -0,0 +1,15 @@ +from databasez import Database + + +async def main(): + async with Database("") as database, database.connection() as connection: + # get the activated transaction + transaction = await connection.transaction() + + try: + # do something + ... + except Exception: + await transaction.rollback() + else: + await transaction.commit() diff --git a/docs_src/transactions/nested_transactions.py b/docs_src/transactions/nested_transactions.py new file mode 100644 index 0000000..0316151 --- /dev/null +++ b/docs_src/transactions/nested_transactions.py @@ -0,0 +1,20 @@ +import contextlib + +import databasez + +async with databasez.Database("database_url") as db: + async with db.transaction() as outer: + # Do something in the outer transaction + ... + + # Suppress to prevent influence on the outer transaction + with contextlib.suppress(ValueError): + async with db.transaction(): + # Do something in the inner transaction + ... + + raise ValueError("Abort the inner transaction") + + # Observe the results of the outer transaction, + # without effects from the inner transaction. + await db.fetch_all("SELECT * FROM ...") From 73a8d7250394f8b17985005be398e8581e3463cc Mon Sep 17 00:00:00 2001 From: alex Date: Mon, 2 Dec 2024 18:40:08 +0100 Subject: [PATCH 3/4] More docs --- docs/connections-and-transactions.md | 27 ++++++++++++------- docs_src/connections/force_rollback.py | 15 +++++++++++ .../force_rollback_transaction.py | 15 +++++++++++ 3 files changed, 48 insertions(+), 9 deletions(-) create mode 100644 docs_src/connections/force_rollback.py create mode 100644 docs_src/transactions/force_rollback_transaction.py diff --git a/docs/connections-and-transactions.md b/docs/connections-and-transactions.md index cac6620..1df41bf 100644 --- a/docs/connections-and-transactions.md +++ b/docs/connections-and-transactions.md @@ -34,6 +34,12 @@ available. This means you have to be careful when using `iterate` to not open another connection via `connection` (except you set `force_rollback` to False before opening the connection). Otherwise it will deadlock. +Example for `force_rollback`: + +```python +{!> ../docs_src/connections/force_rollback.py !} +``` + ## Transactions Transactions are lazily initialized. You dont't need a connected database to create them via `database.transaction()`. @@ -49,15 +55,6 @@ Whenever the transaction is activated, a connected database is required. A second way to get a transaction is via the `Connection`. It has also a `transaction()` method. -### Auto-rollback (`force_rollback`) - -Transactions support an keyword parameter named `force_rollback` which default to `False`. -When set to `True` at the end of the transaction a rollback is tried. -This means all changes are undone. - -This is a simpler variant of `force_rollback` of the database object. - - ### The three ways to use a transaction #### Via the async context manager protocol @@ -87,6 +84,18 @@ For a lower-level transaction API: {!> ../docs_src/transactions/manually.py !} ``` +### Auto-rollback (`force_rollback`) + +Transactions support an keyword parameter named `force_rollback` which default to `False`. +When set to `True` at the end of the transaction a rollback is tried. +This means all changes are undone. + +This is a simpler variant of `force_rollback` of the database object. +```python +{!> ../docs_src/transactions/force_rollback_transaction.py !} +``` + + ### Isolation level The state of a transaction is liked to the connection used in the currently executing async task. diff --git a/docs_src/connections/force_rollback.py b/docs_src/connections/force_rollback.py new file mode 100644 index 0000000..8340e30 --- /dev/null +++ b/docs_src/connections/force_rollback.py @@ -0,0 +1,15 @@ +from databasez import Database + +database = Database("sqlite:///foo.sqlite", force_rollback=True) + + +def test_foo(): + async with database: + ... + # do the tests + # and now everything is rolled back + + async with database: + ... + # do the tests + # and now everything is rolled back again diff --git a/docs_src/transactions/force_rollback_transaction.py b/docs_src/transactions/force_rollback_transaction.py new file mode 100644 index 0000000..8b3155b --- /dev/null +++ b/docs_src/transactions/force_rollback_transaction.py @@ -0,0 +1,15 @@ +from databasez import Database + +database = Database("sqlite:///foo.sqlite") + + +def test_foo(): + async with database: + await database.execute(...) + + async with database.transaction(force_rollback=True): + # this is rolled back + await database.execute(...) + async with database.transaction(force_rollback=False): + ... + # this is saved From cba6ef4803e4f3fe8f6c4c08f4ba6e313983b0e6 Mon Sep 17 00:00:00 2001 From: alex Date: Mon, 2 Dec 2024 18:41:24 +0100 Subject: [PATCH 4/4] ignore export directories --- .gitignore | 3 ++- 1 file changed, 2 insertions(+), 1 deletion(-) diff --git a/.gitignore b/.gitignore index 8d45587..1ade717 100644 --- a/.gitignore +++ b/.gitignore @@ -12,4 +12,5 @@ venv/ .idea/ testsuite.sqlite3 test_testsuite.sqlite3 -site +/site +/dist