Skip to content

Commit eff4c61

Browse files
committed
misc typos/fixes for 0.3.0:
- update README with latest params
- ensure capture dir includes seconds
- bump behaviors to 0.1.1
1 parent b59788e commit eff4c61

File tree

4 files changed

+16
-11
lines changed

4 files changed

+16
-11
lines changed

README.md

Lines changed: 8 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -46,7 +46,7 @@ Browsertrix Crawler includes a number of additional command-line options, explai
4646
The Browsertrix Crawler docker image currently accepts the following parameters:
4747

4848
```
49-
browsertrix-crawler [options]
49+
crawler [options]
5050
5151
Options:
5252
--help Show help [boolean]
@@ -74,18 +74,23 @@ Options:
7474
-c, --collection Collection name to crawl to (replay
7575
will be accessible under this name
7676
in pywb preview)
77-
[string] [default: "capture-2021-04-10T04-49-4"]
77+
[string] [default: "capture-YYYY-MM-DDTHH-MM-SS"]
7878
--headless Run in headless mode, otherwise
7979
start xvfb[boolean] [default: false]
8080
--driver JS driver for the crawler
8181
[string] [default: "/app/defaultDriver.js"]
8282
--generateCDX, --generatecdx, If set, generate index (CDXJ) for
8383
--generateCdx use with pywb after crawl is done
8484
[boolean] [default: false]
85+
--combineWARC, --combinewarc, If set, combine the warcs
86+
--combineWarc [boolean] [default: false]
87+
--rolloverSize If set, declare the rollover size
88+
[number] [default: 1000000000]
8589
--generateWACZ, --generatewacz, If set, generate wacz
8690
--generateWacz [boolean] [default: false]
8791
--logging Logging options for crawler, can
88-
include: stats, pywb, behaviors
92+
include: stats, pywb, behaviors,
93+
behaviors-debug
8994
[string] [default: "stats"]
9095
--text If set, extract text to the
9196
pages.jsonl file

crawler.js

Lines changed: 3 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -48,7 +48,7 @@ class Crawler {
4848
this.profileDir = fs.mkdtempSync(path.join(os.tmpdir(), "profile-"));
4949

5050
const params = require("yargs")
51-
.usage("browsertrix-crawler [options]")
51+
.usage("crawler [options]")
5252
.option(this.cliOpts)
5353
.check((argv) => this.validateArgs(argv)).argv;
5454

@@ -193,7 +193,7 @@ class Crawler {
193193
alias: "c",
194194
describe: "Collection name to crawl to (replay will be accessible under this name in pywb preview)",
195195
type: "string",
196-
default: `capture-${new Date().toISOString().slice(0,18)}`.replace(/:/g, "-")
196+
default: `capture-${new Date().toISOString().slice(0,19)}`.replace(/:/g, "-")
197197
},
198198

199199
"headless": {
@@ -236,7 +236,7 @@ class Crawler {
236236
},
237237

238238
"logging": {
239-
describe: "Logging options for crawler, can include: stats, pywb, behaviors",
239+
describe: "Logging options for crawler, can include: stats, pywb, behaviors, behaviors-debug",
240240
type: "string",
241241
default: "stats",
242242
},

package.json

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -7,7 +7,7 @@
77
"license": "MIT",
88
"dependencies": {
99
"abort-controller": "^3.0.0",
10-
"browsertrix-behaviors": "^0.1.0",
10+
"browsertrix-behaviors": "^0.1.1",
1111
"node-fetch": "^2.6.1",
1212
"puppeteer-cluster": "^0.22.0",
1313
"puppeteer-core": "^5.3.1",

yarn.lock

Lines changed: 4 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -1046,10 +1046,10 @@ browserslist@^4.14.5:
10461046
escalade "^3.1.1"
10471047
node-releases "^1.1.70"
10481048

1049-
browsertrix-behaviors@^0.1.0:
1050-
version "0.1.0"
1051-
resolved "https://registry.yarnpkg.com/browsertrix-behaviors/-/browsertrix-behaviors-0.1.0.tgz#202aabac6dcc2b15fe4777c3cc99d3d0cc042191"
1052-
integrity sha512-AfED59t8b7couu5Vzcy76BoWqCyHtYfmaR5t8ic1MoSfzz40d5WS4HfZqUWvOcoqsUfpJhjlc9R7nCptpQ6tNQ==
1049+
browsertrix-behaviors@^0.1.1:
1050+
version "0.1.1"
1051+
resolved "https://registry.yarnpkg.com/browsertrix-behaviors/-/browsertrix-behaviors-0.1.1.tgz#9b1b44698a6742ecb369a93354837f01307113d2"
1052+
integrity sha512-x7BbuUy3y0yVrXjbNGJT9uS5Pk1nWE9N/2ovre9z7ldV7tzjZBkWGkE14W2iZsuj4mMpJlnpIsAJMcOaYYTowA==
10531053

10541054
10551055
version "2.1.1"

0 commit comments

Comments
 (0)