mirror of
https://github.com/msberends/AMR.git
synced 2025-07-12 17:01:57 +02:00
(v2.1.1.9102) fix sir
This commit is contained in:
62
data-raw/_generate_GPT_knowledge_input.sh
Normal file
62
data-raw/_generate_GPT_knowledge_input.sh
Normal file
@ -0,0 +1,62 @@
|
||||
#!/bin/bash
|
||||
|
||||
# Check if the current directory is named 'AMR'
|
||||
if [ "$(basename "$PWD")" != "AMR" ]; then
|
||||
echo "Error: The script must be run from the 'AMR' directory."
|
||||
exit 1
|
||||
fi
|
||||
|
||||
# Define the output file, located in ./data-raw
|
||||
version="$1"
|
||||
output_file="data-raw/gpt_training_text_v${version}.txt"
|
||||
|
||||
# Clear the output file if it exists
|
||||
echo "This files contains all context you must know about the AMR package for R." > "$output_file"
|
||||
echo -e "\n\n\n\n" >> "$output_file"
|
||||
|
||||
# Function to remove header block (delimited by # ======)
|
||||
remove_header() {
|
||||
sed '/# =\{6,\}/,/# =\{6,\}/d' "$1"
|
||||
}
|
||||
|
||||
# Process all .R files in the 'R' folder
|
||||
for file in R/*.R; do
|
||||
echo "THE PART HEREAFTER CONTAINS CONTENTS FROM FILE $file" >> "$output_file"
|
||||
echo -e "\n\n" >> "$output_file"
|
||||
remove_header "$file" >> "$output_file"
|
||||
echo -e "\n\n" >> "$output_file"
|
||||
done
|
||||
|
||||
# Process all .Rmd files in the 'vignettes' folder
|
||||
for file in vignettes/*.Rmd; do
|
||||
echo "THE PART HEREAFTER CONTAINS CONTENTS FROM FILE $file" >> "$output_file"
|
||||
echo -e "\n\n" >> "$output_file"
|
||||
remove_header "$file" >> "$output_file"
|
||||
echo -e "\n\n" >> "$output_file"
|
||||
done
|
||||
|
||||
# Process important metadata files (DESCRIPTION, NAMESPACE, index.md)
|
||||
for file in DESCRIPTION NAMESPACE index.md; do
|
||||
if [[ -f $file ]]; then
|
||||
echo "THE PART HEREAFTER CONTAINS CONTENTS FROM FILE $file" >> "$output_file"
|
||||
echo -e "\n\n" >> "$output_file"
|
||||
cat "$file" >> "$output_file"
|
||||
echo -e "\n\n" >> "$output_file"
|
||||
fi
|
||||
done
|
||||
|
||||
# Process test files (if available) in the 'tests' folder
|
||||
for file in tests/*.R; do
|
||||
echo "THE PART HEREAFTER CONTAINS CONTENTS FROM FILE $file" >> "$output_file"
|
||||
echo -e "\n\n" >> "$output_file"
|
||||
remove_header "$file" >> "$output_file"
|
||||
echo -e "\n\n" >> "$output_file"
|
||||
done
|
||||
|
||||
# Process all .Rd files from the 'man' folder
|
||||
for file in man/*.Rd; do
|
||||
echo "THE PART HEREAFTER CONTAINS CONTENTS FROM FILE $file" >> "$output_file"
|
||||
echo -e "\n\n" >> "$output_file"
|
||||
remove_header "$file" >> "$output_file"
|
||||
echo -e "\n\n" >> "$output_file"
|
||||
done
|
Reference in New Issue
Block a user