File transformation.py of Package ansible-sap-infrastructure
# This Python script updates upstream with downstream customizations before packaging.
# All customizations are defined in separate yaml file.
# List of available customizations:
# - remove_paths - Removes the specified files or directories.
# - remove_lines - Removes lines matching the patterns from the files matching specified glob patterns.
# - replace_text - Replaces text in files matching specified glob patterns.
# - update_yaml_key - Updates a specific key's value in the specified YAML files matching specified glob patterns.
# - append_yaml_list - Appends a new item to a list in the specified YAML files matching specified glob patterns.
# - set_yaml_value - Sets or replaces a specific key's value in the specified YAML files matching specified glob patterns.
# - remove_yaml_list_items - Removes specific items from a list in the specified YAML files matching specified glob patterns.
# Intended use: Executed by spec file during %prep
import os
import shutil
import re
import glob
import argparse
# Requires entry in spec file: BuildRequires: python3-ruamel.yaml
from ruamel.yaml import YAML
yaml = YAML()
yaml.preserve_quotes = True # Preserves quotes
yaml.indent(mapping=2, sequence=4, offset=2) # Preserves indents in yaml
yaml.width = 4096 # Disable ruamel wrapping long lines
def load_config(config_file):
"""Loads the configuration from a YAML file.
"""
with open(config_file, 'r') as f:
return yaml.load(f)
def remove_paths(build_dir, paths):
"""Removes the specified files or directories.
This function iterates through a list of path patterns, finds all matching
files and directories using glob, and removes them. This is useful for
cleaning up a build directory by removing unnecessary files or directories
before packaging.
Args:
build_dir (str): The absolute path to the base directory from which
paths will be removed.
paths (list[str]): A list of path patterns to remove. These paths are
relative to `build_dir` and can include glob patterns (e.g., '*.txt',
'temp/**').
Example:
```yaml
changes:
- type: remove_paths
paths:
- "roles/*/meta/main.yml"
```
"""
for path_pattern in paths:
full_pattern = os.path.join(build_dir, path_pattern)
for item in glob.glob(full_pattern):
relative_path = os.path.relpath(item, build_dir)
if os.path.isdir(item):
print(f"Removed: {relative_path}")
shutil.rmtree(item, ignore_errors=True)
elif os.path.isfile(item):
print(f"Removed: {relative_path}")
os.remove(item)
def remove_lines(build_dir, files_patterns, patterns):
"""Removes lines matching the patterns from the files matching specified glob patterns.
This function finds files matching the given glob patterns and then reads
each file to remove any lines that match any of the specified regular
expression patterns. This is useful for cleaning up documentation or
configuration files by removing obsolete or unwanted content.
Args:
build_dir (str): The absolute path to the base directory where the
files are located.
files_patterns (list[str]): A list of file path patterns to process.
These paths are relative to `build_dir` and support glob
patterns (e.g., 'docs/*.md', 'roles/**/tasks/main.yml').
patterns (list[str]): A list of regular expression patterns. Any line
in the target files that matches one of these patterns will be
removed.
Example:
```yaml
changes:
- type: remove_lines
files:
- "README.md"
- "roles/*/README.md"
patterns:
- "\\[Ansible Lint"
```
"""
for file_pattern in files_patterns:
full_pattern = os.path.join(build_dir, file_pattern)
for file_path in glob.glob(full_pattern):
if os.path.isfile(file_path):
relative_path = os.path.relpath(file_path, build_dir)
with open(file_path, 'r') as f:
lines = f.readlines()
updated_lines = [
line
for line in lines
if not any(re.search(pattern, line) for pattern in patterns)
]
with open(file_path, 'w') as f:
f.writelines(updated_lines)
print(f"Removed lines from: {relative_path}")
def replace_text(build_dir, files_patterns, replacements):
"""Replaces text in files matching specified glob patterns.
This function finds all files matching the given patterns and performs a
series of find-and-replace operations on their content. The 'find'
patterns are treated as regular expressions, allowing for powerful and
flexible text manipulation. This is useful for updating project-wide
values like namespaces, repository URLs, or other boilerplate text.
Args:
build_dir (str): The absolute path to the base directory where the
files are located.
files_patterns (list[str]): A list of file path patterns to process.
These paths are relative to `build_dir` and support glob
patterns (e.g., 'README.md', 'roles/**/*.yml').
replacements (list[dict[str, str]]): A list of replacement rules.
Each rule is a dictionary with two keys:
- 'find': The regular expression pattern to search for.
- 'replace': The string to substitute for each match.
Example:
```yaml
changes:
- type: replace_text
files:
- "galaxy.yml"
replacements:
- { find: "namespace: community", replace: "namespace: suse" }
```
"""
for file_pattern in files_patterns:
full_pattern = os.path.join(build_dir, file_pattern)
for file_path in glob.glob(full_pattern):
if os.path.isfile(file_path):
relative_path = os.path.relpath(file_path, build_dir)
with open(file_path, 'r') as f:
content = f.read()
for replacement in replacements:
content = re.sub(
replacement['find'],
replacement['replace'],
content,
flags=re.MULTILINE,
)
with open(file_path, 'w') as f:
f.write(content)
print(
f"Replaced text {replacement['find']} with {replacement['replace']} in: {relative_path}"
)
def read_yaml_header(file_path):
"""Reads the header of a YAML file (lines before the first '---').
Args:
file_path (str): The path to the YAML file.
Returns:
list: A list of lines representing the header of the YAML file.
"""
header_lines = []
with open(file_path, 'r') as f:
for line in f:
if line.strip() == '---':
header_lines.append(line)
break
header_lines.append(line)
return header_lines
def update_yaml_key(build_dir, files_patterns, key_path, value):
"""Updates a specific key's value in the specified YAML files, preserving the header.
This function finds all YAML files matching the given patterns and updates
the value of a specified key. The key can be nested, using dot notation
for the path (e.g., 'parent.child.key'). If the key or any part of its
path does not exist, it will be created.
The function is designed to preserve YAML formatting, including comments
and indentation, by using `ruamel.yaml` and by explicitly handling
non-YAML headers (lines before the first '---').
Args:
build_dir (str): The absolute path to the base directory where the
YAML files are located.
files_patterns (list[str]): A list of file path patterns to process,
relative to `build_dir`. Supports glob patterns (e.g., 'galaxy.yml',
'roles/**/meta.yml').
key_path (str): The dot-separated path to the key to update
(e.g., 'info.version', 'authors').
value (any): The new value to assign to the key. This can be any
YAML-compatible type (string, list, dictionary, etc.).
Example:
```yaml
changes:
- type: update_yaml_key
files:
- "galaxy.yml"
key: "build_ignore"
value:
- "tests"
```
"""
for file_pattern in files_patterns:
full_pattern = os.path.join(build_dir, file_pattern)
for file_path in glob.glob(full_pattern):
if os.path.exists(file_path):
try:
relative_path = os.path.relpath(file_path, build_dir)
header_lines = read_yaml_header(file_path)
with open(file_path, 'r') as f:
# Skip header lines when loading
for _ in header_lines:
next(f, None)
data = yaml.load(f)
keys = key_path.split('.')
current_level = data
for i, key in enumerate(keys):
if i == len(keys) - 1:
if key not in current_level:
print(
f"Warning: Key '{key_path}' not found in {relative_path}"
)
else:
current_level[key] = value
print(f"Updated key '{key_path}' in: {relative_path}")
else:
if key not in current_level:
current_level[key] = {}
print(
f"Created missing key '{key}' in path '{key_path}' in: {relative_path}"
)
current_level = current_level[key]
with open(file_path, 'w') as f:
f.writelines(header_lines)
yaml.dump(data, f)
except Exception as e:
print(f"Error processing YAML in {relative_path}: {e}")
def append_yaml_list(build_dir, files_patterns, list_key_path, new_item):
"""Appends a new item to a list in the specified YAML files, preserving the header.
This function finds all YAML files matching the given patterns and appends
a new item to a specified list. The list is identified by a dot-separated
key path. If the list or any part of its path does not exist, it will be
created. The function ensures the item is not added if it already exists
in the list, preventing duplicates.
Like other YAML modification functions in this script, it preserves
comments and formatting by using `ruamel.yaml` and handling file headers.
Args:
build_dir (str): The absolute path to the base directory where the
YAML files are located.
files_patterns (list[str]): A list of file path patterns to process,
relative to `build_dir`. Supports glob patterns.
list_key_path (str): The dot-separated path to the list to which the
item will be appended (e.g., 'galaxy_info.platforms').
new_item (any): The item to append to the list. This can be a simple
string or a more complex dictionary.
Example:
```yaml
changes:
- type: append_yaml_list
files:
- "roles/*/meta/main.yml"
list_key: "galaxy_info.platforms"
new_item:
name: "SLES"
versions:
- "15"
```
"""
for file_pattern in files_patterns:
full_pattern = os.path.join(build_dir, file_pattern)
for file_path in glob.glob(full_pattern):
if os.path.exists(file_path):
try:
relative_path = os.path.relpath(file_path, build_dir)
header_lines = read_yaml_header(file_path)
with open(file_path, 'r') as f:
# Skip header lines when loading
for _ in header_lines:
next(f, None)
data = yaml.load(f)
keys = list_key_path.split('.')
current_level = data
for i, key in enumerate(keys):
if i == len(keys) - 1:
if key not in current_level:
current_level[key] = []
print(
f"Created missing list '{list_key_path}' in: {relative_path}"
)
if isinstance(current_level[key], list):
if new_item not in current_level[key]:
current_level[key].append(new_item)
print(
f"Appended item to list '{list_key_path}' in: {relative_path}"
)
else:
print(
f"Item '{new_item}' already exists in list '{list_key_path}' in: {relative_path}"
)
else:
if key not in current_level:
current_level[key] = {}
print(
f"Created missing key '{key}' in path '{list_key_path}' in: {relative_path}"
)
current_level = current_level[key]
with open(file_path, 'w') as f:
f.writelines(header_lines)
yaml.dump(data, f)
except Exception as e:
print(f"Error processing YAML in {relative_path}: {e}")
def set_yaml_value(build_dir, files_patterns, key_path, value):
"""Sets or replaces a specific key's value in the specified YAML files, preserving the header.
This function finds all YAML files matching the given patterns and sets a
specified key to a new value. The key can be nested, using dot notation
for the path (e.g., 'parent.child.key').
Unlike `update_yaml_key`, this function will always set the value. If the
key or any part of its path does not exist, it will be created. This is
useful for overwriting existing values or ensuring a key is present with
a specific value.
Args:
build_dir (str): The absolute path to the base directory where the
YAML files are located.
files_patterns (list[str]): A list of file path patterns to process,
relative to `build_dir`. Supports glob patterns.
key_path (str): The dot-separated path to the key to set or create
(e.g., 'collections', 'info.version').
value (any): The new value to assign to the key. This can be any
YAML-compatible type (string, list, dictionary, etc.).
Example:
```yaml
changes:
- type: set_yaml_value
files:
- "special_actions/*/ansible_requirements.yml"
key: "collections"
value: []
```
"""
for file_pattern in files_patterns:
full_pattern = os.path.join(build_dir, file_pattern)
for file_path in glob.glob(full_pattern):
if os.path.exists(file_path):
relative_path = os.path.relpath(file_path, build_dir)
try:
header_lines = read_yaml_header(file_path)
with open(file_path, 'r') as f:
# Skip header lines when loading
for _ in header_lines:
next(f, None)
data = yaml.load(f)
keys = key_path.split('.')
current_level = data
for i, key in enumerate(keys):
if i == len(keys) - 1:
current_level[key] = value
print(f"Set key '{key_path}' in: {relative_path}")
else:
if key not in current_level:
current_level[key] = {}
print(
f"Created missing key '{key}' in path '{key_path}' in: {relative_path}"
)
current_level = current_level[key]
with open(file_path, 'w') as f:
f.writelines(header_lines)
yaml.dump(data, f)
except Exception as e:
print(f"Error processing YAML in {relative_path}: {e}")
def remove_yaml_list_items(build_dir, files_patterns, list_key_path, items_to_remove):
"""Removes specific items from a list in the specified YAML files.
This function finds all YAML files matching the given glob patterns and
removes specified items from a list within those files. The list is
identified by a dot-separated key path.
Args:
build_dir (str): The absolute path to the base directory where the
YAML files are located.
files_patterns (list[str]): A list of file path patterns to process,
relative to `build_dir`. Supports glob patterns.
list_key_path (str): The dot-separated path to the list from which
items will be removed (e.g., 'collections').
items_to_remove (list[any]): A list of specification items. Any item
in the target list that matches one of these specifications will
be removed.
Example:
```yaml
changes:
- type: remove_yaml_list_items
files:
- "deploy_scenarios/*/ansible_requirements.yml"
list_key: "collections"
items_to_remove:
- name: "community.sap_install"
```
"""
def item_matches(list_item, spec_item):
"""Check if a list item matches a specification item."""
if isinstance(list_item, dict) and isinstance(spec_item, dict):
# For dicts, check if list_item contains all key-value pairs from spec_item.
return all(k in list_item and list_item[k] == v for k, v in spec_item.items())
# For other types (like strings), use simple equality.
return list_item == spec_item
for file_pattern in files_patterns:
full_pattern = os.path.join(build_dir, file_pattern)
for file_path in glob.glob(full_pattern):
if os.path.isfile(file_path):
relative_path = os.path.relpath(file_path, build_dir)
try:
header_lines = read_yaml_header(file_path)
with open(file_path, 'r') as f:
for _ in header_lines:
next(f, None)
data = yaml.load(f)
# Skip if there is nothing to update.
if data is None:
continue
keys = list_key_path.split('.')
current_level = data
modified = False
path_exists = True
for i, key in enumerate(keys):
if not (isinstance(current_level, dict) and key in current_level):
path_exists = False
break
if i < len(keys) - 1:
current_level = current_level[key]
if not path_exists:
print(f"Warning: Path '{list_key_path}' not found in {relative_path}. Skipping.")
continue
list_key = keys[-1]
if isinstance(current_level[list_key], list):
target_list = current_level[list_key]
initial_len = len(target_list)
new_list = [item for item in target_list if not any(item_matches(item, rem_spec) for rem_spec in items_to_remove)]
if len(new_list) < initial_len:
current_level[list_key] = new_list
print(f"Removed {initial_len - len(new_list)} item(s) from list '{list_key_path}' in: {relative_path}")
modified = True
if modified:
with open(file_path, 'w') as f:
f.writelines(header_lines)
yaml.dump(data, f)
except Exception as e:
print(f"Error processing YAML in {relative_path}: {e}")
def main():
"""Main function to load config and apply changes."""
parser = argparse.ArgumentParser(description="Change files in a specified directory based on a configuration file.")
parser.add_argument("--build_dir", help="The path to the build directory where changes will occur." )
parser.add_argument("--config", help="The path to the configuration YAML file (default: config.yaml)." )
args = parser.parse_args()
config_file = args.config
build_dir = args.build_dir
if not os.path.isdir(build_dir):
print(f"Error: Build directory '{build_dir}' does not exist.")
return
config = load_config(config_file)
changes = config.get('changes', [])
for change in changes:
change_type = change.get('type')
if change_type == 'remove_paths':
remove_paths(build_dir, change.get('paths', []))
elif change_type == 'remove_lines':
remove_lines(build_dir, change.get('files', []), change.get('patterns', []))
elif change_type == 'replace_text':
replace_text(build_dir, change.get('files', []), change.get('replacements', []))
elif change_type == 'update_yaml_key':
update_yaml_key(build_dir, change.get('files', []), change.get('key'), change.get('value'))
elif change_type == 'append_yaml_list':
append_yaml_list(build_dir, change.get('files', []), change.get('list_key'), change.get('new_item'))
elif change_type == 'set_yaml_value':
set_yaml_value(build_dir, change.get('files', []), change.get('key'), change.get('value'))
elif change_type == 'remove_yaml_list_items':
remove_yaml_list_items(build_dir, change.get('files', []), change.get('list_key'), change.get('items_to_remove'))
else:
print(f"Unknown changes type: {change['type']}")
if __name__ == "__main__":
main()