Skip to content

Commit aa8786a

Browse files
committed
feat(#138): paths
1 parent 0aa6fe8 commit aa8786a

2 files changed

Lines changed: 15 additions & 13 deletions

File tree

.github/workflows/collect.yml

Lines changed: 8 additions & 5 deletions
Original file line number | Diff line number | Diff line change
@@ -59,16 +59,19 @@ jobs:
5959
just install
6060
poetry install
6161
just collect "collection/${{ inputs.out }}" "${{ inputs.start }}" \
62-
"${{ inputs.end }}" "repos" "$TOKEN"
63-
just filter "repos-with-pulls.csv" "after-filter.csv"
64-
just extract "after-filter.csv" "after-extract.csv"
65-
just maven "after-extract.csv" "$TOKEN" \
66-
"after-maven.csv"
62+
"${{ inputs.end }}" "repos"
63+
just pulls "../repos.csv" "$TOKEN" "../repos-with-pulls.csv"
64+
just filter "../repos-with-pulls.csv" "../after-filter.csv"
65+
just swc "../after-filter.csv" "../after-swc.csv"
66+
just extract "../after-swc.csv" "../after-extract.csv"
67+
just maven "../after-extract.csv" "$TOKEN" \
68+
"../after-maven.csv"
6769
} 2>&1 | tee -a collect.log
6870
sed -i "s|$TOKEN|REDACTED|g" collect.log
6971
cp "repos.csv" "collection/${{ inputs.out }}"
7072
cp "repos-with-pulls.csv" "collection/${{ inputs.out }}"
7173
cp "after-filter.csv" "collection/${{ inputs.out }}"
74+
cp "after-swc.csv" "collection/${{ inputs.out }}"
7275
cp "after-extract.csv" "collection/${{ inputs.out }}"
7376
cp "after-maven.csv" "collection/${{ inputs.out }}"
7477
cp "collect.log" collection/${{ inputs.out }}

justfile

Lines changed: 7 additions & 8 deletions
Original file line number | Diff line number | Diff line change
@@ -61,11 +61,10 @@ clean:
6161
rm sr-data/experiment/* && rmdir sr-data/experiment
6262

6363
# Collect repositories.
64-
collect dir start end out token:
64+
collect dir start end out:
6565
mkdir -p {{dir}}
6666
ghminer --query "stars:>10 language:java size:>=20 mirror:false template:false NOT android" \
6767
--start "{{start}}" --end "{{end}}" --tokens "$PATS" --filename "{{out}}"
68-
just pulls "../{{out}}.csv" "{{token}}" "../{{out}}-with-pulls.csv"
6968

7069
# Fetch pulls count for collected repos.
7170
pulls repos token out="experiment/with-pulls.csv":
@@ -74,8 +73,8 @@ pulls repos token out="experiment/with-pulls.csv":
7473

7574
# Collect maven pom.xml files.
7675
maven repos token out="experiment/with-maven.csv":
77-
cd sr-data && poetry poe maven --repos "../{{repos}}" --token "{{token}}" \
78-
--out "../{{out}}"
76+
cd sr-data && poetry poe maven --repos "{{repos}}" --token "{{token}}" \
77+
--out "{{out}}"
7978

8079
# Collect test repositories.
8180
test-collect:
@@ -86,16 +85,16 @@ test-collect:
8685

8786
# Filter collected repositories.
8887
filter repos out="experiment/after-filter.csv":
89-
cd sr-data && poetry poe filter --repos "../{{repos}}" --out "../{{out}}"
88+
cd sr-data && poetry poe filter --repos "{{repos}}" --out "{{out}}"
9089

9190
# Extract headings from README files.
9291
extract repos out="experiment/after-extract.csv":
93-
cd sr-data && poetry poe extract --repos "../{{repos}}" --out "../{{out}}"
92+
cd sr-data && poetry poe extract --repos "{{repos}}" --out "{{out}}"
9493

9594
# Special words count.
9695
swc repos out="experiment/after-swc.csv" config="resources/swc-words.txt":
97-
cd sr-data && poetry poe swc --repos {{repos}} --out {{out}} \
98-
--config {{config}}
96+
cd sr-data && poetry poe swc --repos "{{repos}}" --out "{{out}}" \
97+
--config "{{config}}"
9998

10099
# Create embeddings.
101100
embed repos prefix="experiment/embeddings":

0 commit comments

Comments
 (0)