forked from apache/datafusion-ballista
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathupdate_datafusion_versions.py
executable file
·120 lines (96 loc) · 4.01 KB
/
update_datafusion_versions.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
#!/usr/bin/env python
#
# Licensed to the Apache Software Foundation (ASF) under one or more
# contributor license agreements. See the NOTICE file distributed with
# this work for additional information regarding copyright ownership.
# The ASF licenses this file to You under the Apache License, Version 2.0
# (the "License"); you may not use this file except in compliance with
# the License. You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
#
# Script that updates versions for datafusion crates, locally
#
# dependencies:
# pip install tomlkit
import re
import os
import argparse
from pathlib import Path
import tomlkit
# DataFusion crates whose own `package.version` gets bumped.
# Maps crate name -> path of that crate's Cargo.toml. The names are also the
# dependency keys looked up in downstream manifests.
crates = {
    'datafusion': 'datafusion/core/Cargo.toml',
    'datafusion-cli': 'datafusion-cli/Cargo.toml',
    'datafusion-common': 'datafusion/common/Cargo.toml',
    'datafusion-data-access': 'datafusion/data-access/Cargo.toml',
    'datafusion-expr': 'datafusion/expr/Cargo.toml',
    'datafusion-jit': 'datafusion/jit/Cargo.toml',
    'datafusion-physical-expr': 'datafusion/physical-expr/Cargo.toml',
    'datafusion-proto': 'datafusion/proto/Cargo.toml',
    'datafusion-row': 'datafusion/row/Cargo.toml',
}

# Ballista crates: only their datafusion dependency pins are updated, never
# their own package version. Maps crate name -> path of its Cargo.toml.
ballista_crates = {
    'ballista-cli': 'ballista-cli/Cargo.toml',
    'core': 'ballista/core/Cargo.toml',
    'client': 'ballista/client/Cargo.toml',
    'executor': 'ballista/executor/Cargo.toml',
    'scheduler': 'ballista/scheduler/Cargo.toml',
}
def update_datafusion_version(cargo_toml: str, new_version: str):
    """Set ``package.version`` in a Cargo manifest to *new_version*.

    The manifest is parsed with tomlkit, the version entry is replaced, and
    the document is serialized back to the same path.

    Args:
        cargo_toml: Path of the Cargo.toml file to rewrite in place.
        new_version: Version string to store under ``[package]``.
    """
    print(f'updating {cargo_toml}')

    with open(cargo_toml) as src:
        manifest = tomlkit.parse(src.read())

    # Assumes the manifest declares a [package] table.
    package = manifest.get('package')
    package['version'] = new_version

    with open(cargo_toml, 'w') as dst:
        dst.write(tomlkit.dumps(manifest))
def update_downstream_versions(cargo_toml: str, new_version: str):
    """Update datafusion dependency pins in a Cargo manifest.

    For every crate name in the module-level ``crates`` mapping, the
    ``[dependencies]`` and ``[dev-dependencies]`` tables of *cargo_toml* are
    checked. A matching entry is updated when it carries a version, either
    as the shorthand string form (``datafusion = "8.0.0"``) or as a table
    with a ``version`` key. Entries without a version (for example ones
    pinned by git hash) are left untouched. The manifest is always written
    back to the same path.

    Args:
        cargo_toml: Path of the Cargo.toml file to rewrite in place.
        new_version: Version string to store for each matching dependency.
    """
    with open(cargo_toml) as f:
        doc = tomlkit.parse(f.read())

    # (manifest table, label used in the progress message)
    sections = (
        ('dependencies', 'dependency'),
        ('dev-dependencies', 'dev-dependency'),
    )

    for crate in crates:
        for section, label in sections:
            deps = doc.get(section)
            if deps is None:
                continue

            df_dep = deps.get(crate)
            if df_dep is None:
                continue

            if isinstance(df_dep, str):
                # Shorthand `crate = "x.y.z"`: the value itself is the
                # version and has no `.get`, so replace the whole entry.
                print(f'updating {crate} {label} in {cargo_toml}')
                deps[crate] = new_version
            elif df_dep.get('version') is not None:
                # skip crates that pin datafusion using git hash
                print(f'updating {crate} {label} in {cargo_toml}')
                df_dep['version'] = new_version

    with open(cargo_toml, 'w') as f:
        f.write(tomlkit.dumps(doc))
def update_docs(path: str, new_version: str):
    """Rewrite ``datafusion = "<version>"`` pins in a documentation file.

    Every occurrence of ``datafusion = "..."`` in the file at *path* is
    replaced with ``datafusion = "<new_version>"`` and the file is rewritten
    in place.

    Args:
        path: Path of the text file to update.
        new_version: Version string to put between the quotes.
    """
    print(f"updating docs in {path}")
    with open(path, 'r+') as fd:
        content = fd.read()
        # Match only up to the closing quote on the same line; a greedy
        # `.+` would swallow everything up to the last quote on the line.
        content = re.sub(
            r'datafusion = "[^"\n]+"',
            f'datafusion = "{new_version}"',
            content,
        )
        fd.seek(0)
        fd.write(content)
        # The new text may be shorter than the old (e.g. "10.0.0" ->
        # "9.0.0"); cut off the stale tail left behind by the overwrite.
        fd.truncate()
def main():
    """Parse the command line and apply the new version everywhere.

    Takes one positional argument, ``new_version``. It then:

    1. sets the package version of every manifest in ``crates``;
    2. updates datafusion dependency pins in every manifest in ``crates``
       and then in ``ballista_crates``;
    3. updates the version pin shown in ``README.md``.
    """
    description = (
        'Update datafusion crate version and corresponding version pins '
        'in downstream crates.'
    )
    cli = argparse.ArgumentParser(description=description)
    cli.add_argument('new_version', type=str, help='new datafusion version')
    new_version = cli.parse_args().new_version

    # NOTE(review): repo_root only appears in the log messages below; every
    # path that is opened is relative to the current working directory.
    repo_root = Path(__file__).parent.parent.absolute()

    print(f'Updating datafusion crate versions in {repo_root} to {new_version}')
    for manifest in crates.values():
        update_datafusion_version(manifest, new_version)

    print(f'Updating datafusion dependency versions in {repo_root} to {new_version}')
    # datafusion manifests first, then the ballista ones.
    for manifest in [*crates.values(), *ballista_crates.values()]:
        update_downstream_versions(manifest, new_version)

    update_docs("README.md", new_version)
# Run the updater only when executed as a script, not when imported.
if __name__ == "__main__":
    main()