tests: re-tool integration tests

This basically rewrites every integration test. We reduce the amount of magic involved here in terms of which arguments are being passed to ripgrep processes. To make up for the boiler plate saved by the magic, we make the Dir (formerly WorkDir) type a bit nicer to use, along with a new TestCommand that wraps a std::process::Command. In exchange, we get tests that are easier to read and write. We also run every test with the `--pcre2` flag to make sure that works, when PCRE2 is available.
author: Andrew Gallant <jamslam@gmail.com> 2018-08-06 20:11:58 -0400
committer: Andrew Gallant <jamslam@gmail.com> 2018-08-20 07:10:19 -0400
commit: eb184d7711a3d01b2fd3a4281b193f39f7e9a2c5 (patch)
tree: 6531c55af7eae5670d224d347763ad1e3216e8b4
parent: bb110c1ebeeda452046830b3991f705f5759da92 (diff)
11 files changed, 2807 insertions, 2412 deletions
diff --git a/Cargo.lock b/Cargo.lock
index 57d2975b..d11b1608 100644
--- a/Cargo.lock
+++ b/Cargo.lock
@@ -381,6 +381,8 @@ dependencies = [
  "num_cpus 1.8.0 (registry+https://github.com/rust-lang/crates.io-index)",
  "regex 1.0.2 (registry+https://github.com/rust-lang/crates.io-index)",
  "same-file 1.0.2 (registry+https://github.com/rust-lang/crates.io-index)",
+ "serde 1.0.70 (registry+https://github.com/rust-lang/crates.io-index)",
+ "serde_derive 1.0.70 (registry+https://github.com/rust-lang/crates.io-index)",
  "serde_json 1.0.24 (registry+https://github.com/rust-lang/crates.io-index)",
  "termcolor 1.0.1 (registry+https://github.com/rust-lang/crates.io-index)",
  "winapi 0.3.5 (registry+https://github.com/rust-lang/crates.io-index)",
diff --git a/Cargo.toml b/Cargo.toml
index 74648607..208a07b5 100644
--- a/Cargo.toml
+++ b/Cargo.toml
@@ -73,6 +73,10 @@ version = "2.29.4"
 default-features = false
 features = ["suggestions", "color"]
 
+[dev-dependencies]
+serde = "1"
+serde_derive = "1"
+
 [features]
 avx-accel = ["grep/avx-accel"]
 simd-accel = ["grep/simd-accel"]
diff --git a/tests/feature.rs b/tests/feature.rs
new file mode 100644
index 00000000..5b14a0d2
--- /dev/null
+++ b/tests/feature.rs
@@ -0,0 +1,631 @@
+use hay::{SHERLOCK, SHERLOCK_CRLF};
+use util::{Dir, TestCommand, sort_lines};
+
+// See: https://github.com/BurntSushi/ripgrep/issues/1
+rgtest!(f1_sjis, |dir: Dir, mut cmd: TestCommand| {
+    dir.create_bytes(
+        "foo",
+        b"\x84Y\x84u\x84\x82\x84|\x84\x80\x84{ \x84V\x84\x80\x84|\x84}\x84\x83"
+    );
+    cmd.arg("-Esjis").arg("Шерлок Холмс");
+    eqnice!("foo:Шерлок Холмс\n", cmd.stdout());
+});
+
+// See: https://github.com/BurntSushi/ripgrep/issues/1
+rgtest!(f1_utf16_auto, |dir: Dir, mut cmd: TestCommand| {
+    dir.create_bytes(
+        "foo",
+        b"\xff\xfe(\x045\x04@\x04;\x04>\x04:\x04 \x00%\x04>\x04;\x04<\x04A\x04"
+    );
+    cmd.arg("Шерлок Холмс");
+    eqnice!("foo:Шерлок Холмс\n", cmd.stdout());
+});
+
+// See: https://github.com/BurntSushi/ripgrep/issues/1
+rgtest!(f1_utf16_explicit, |dir: Dir, mut cmd: TestCommand| {
+    dir.create_bytes(
+        "foo",
+        b"\xff\xfe(\x045\x04@\x04;\x04>\x04:\x04 \x00%\x04>\x04;\x04<\x04A\x04"
+    );
+    cmd.arg("-Eutf-16le").arg("Шерлок Холмс");
+    eqnice!("foo:Шерлок Холмс\n", cmd.stdout());
+});
+
+// See: https://github.com/BurntSushi/ripgrep/issues/1
+rgtest!(f1_eucjp, |dir: Dir, mut cmd: TestCommand| {
+    dir.create_bytes(
+        "foo",
+        b"\xa7\xba\xa7\xd6\xa7\xe2\xa7\xdd\xa7\xe0\xa7\xdc \xa7\xb7\xa7\xe0\xa7\xdd\xa7\xde\xa7\xe3"
+    );
+    cmd.arg("-Eeuc-jp").arg("Шерлок Холмс");
+    eqnice!("foo:Шерлок Холмс\n", cmd.stdout());
+});
+
+// See: https://github.com/BurntSushi/ripgrep/issues/1
+rgtest!(f1_unknown_encoding, |_: Dir, mut cmd: TestCommand| {
+    cmd.arg("-Efoobar").assert_non_empty_stderr();
+});
+
+// See: https://github.com/BurntSushi/ripgrep/issues/1
+rgtest!(f1_replacement_encoding, |_: Dir, mut cmd: TestCommand| {
+    cmd.arg("-Ecsiso2022kr").assert_non_empty_stderr();
+});
+
+// See: https://github.com/BurntSushi/ripgrep/issues/7
+rgtest!(f7, |dir: Dir, mut cmd: TestCommand| {
+    dir.create("sherlock", SHERLOCK);
+    dir.create("pat", "Sherlock\nHolmes");
+
+    let expected = "\
+For the Doctor Watsons of this world, as opposed to the Sherlock
+Holmeses, success in the province of detective work must always
+be, to a very large extent, the result of luck. Sherlock Holmes
+";
+    eqnice!(expected, cmd.arg("-fpat").arg("sherlock").stdout());
+});
+
+// See: https://github.com/BurntSushi/ripgrep/issues/7
+rgtest!(f7_stdin, |dir: Dir, mut cmd: TestCommand| {
+    dir.create("sherlock", SHERLOCK);
+
+    let expected = "\
+sherlock:For the Doctor Watsons of this world, as opposed to the Sherlock
+sherlock:be, to a very large extent, the result of luck. Sherlock Holmes
+";
+    eqnice!(expected, cmd.arg("-f-").pipe("Sherlock"));
+});
+
+// See: https://github.com/BurntSushi/ripgrep/issues/20
+rgtest!(f20_no_filename, |dir: Dir, mut cmd: TestCommand| {
+    dir.create("sherlock", SHERLOCK);
+    cmd.arg("--no-filename");
+
+    let expected = "\
+For the Doctor Watsons of this world, as opposed to the Sherlock
+be, to a very large extent, the result of luck. Sherlock Holmes
+";
+    eqnice!(expected, cmd.arg("--no-filename").arg("Sherlock").stdout());
+});
+
+// See: https://github.com/BurntSushi/ripgrep/issues/34
+rgtest!(f34_only_matching, |dir: Dir, mut cmd: TestCommand| {
+    dir.create("sherlock", SHERLOCK);
+
+    let expected = "\
+sherlock:Sherlock
+sherlock:Sherlock
+";
+    eqnice!(expected, cmd.arg("-o").arg("Sherlock").stdout());
+});
+
+// See: https://github.com/BurntSushi/ripgrep/issues/34
+rgtest!(f34_only_matching_line_column, |dir: Dir, mut cmd: TestCommand| {
+    dir.create("sherlock", SHERLOCK);
+
+    let expected = "\
+sherlock:1:57:Sherlock
+sherlock:3:49:Sherlock
+";
+    cmd.arg("-o").arg("--column").arg("-n").arg("Sherlock");
+    eqnice!(expected, cmd.stdout());
+});
+
+// See: https://github.com/BurntSushi/ripgrep/issues/45
+rgtest!(f45_relative_cwd, |dir: Dir, mut cmd: TestCommand| {
+    dir.create(".not-an-ignore", "foo\n/bar");
+    dir.create_dir("bar");
+    dir.create_dir("baz/bar");
+    dir.create_dir("baz/baz/bar");
+    dir.create("bar/test", "test");
+    dir.create("baz/bar/test", "test");
+    dir.create("baz/baz/bar/test", "test");
+    dir.create("baz/foo", "test");
+    dir.create("baz/test", "test");
+    dir.create("foo", "test");
+    dir.create("test", "test");
+
+    cmd.arg("-l").arg("test");
+
+    // First, get a baseline without applying ignore rules.
+    let expected = "
+bar/test
+baz/bar/test
+baz/baz/bar/test
+baz/foo
+baz/test
+foo
+test
+";
+    eqnice!(sort_lines(expected), sort_lines(&cmd.stdout()));
+
+    // Now try again with the ignore file activated.
+    cmd.arg("--ignore-file").arg(".not-an-ignore");
+    let expected = "
+baz/bar/test
+baz/baz/bar/test
+baz/test
+test
+";
+    eqnice!(sort_lines(expected), sort_lines(&cmd.stdout()));
+
+    // Now do it again, but inside the baz directory. Since the ignore file
+    // is interpreted relative to the CWD, this will cause the /bar anchored
+    // pattern to filter out baz/bar, which is a subtle difference between true
+    // parent ignore files and manually specified ignore files.
+    let mut cmd = dir.command();
+    cmd.args(&["--ignore-file", "../.not-an-ignore", "-l", "test"]);
+    cmd.current_dir(dir.path().join("baz"));
+    let expected = "
+baz/bar/test
+test
+";
+    eqnice!(sort_lines(expected), sort_lines(&cmd.stdout()));
+});
+
+// See: https://github.com/BurntSushi/ripgrep/issues/45
+rgtest!(f45_precedence_with_others, |dir: Dir, mut cmd: TestCommand| {
+    dir.create(".not-an-ignore", "*.log");
+    dir.create(".ignore", "!imp.log");
+    dir.create("imp.log", "test");
+    dir.create("wat.log", "test");
+
+    cmd.arg("--ignore-file").arg(".not-an-ignore").arg("test");
+    eqnice!("imp.log:test\n", cmd.stdout());
+});
+
+// See: https://github.com/BurntSushi/ripgrep/issues/45
+rgtest!(f45_precedence_internal, |dir: Dir, mut cmd: TestCommand| {
+    dir.create(".not-an-ignore1", "*.log");
+    dir.create(".not-an-ignore2", "!imp.log");
+    dir.create("imp.log", "test");
+    dir.create("wat.log", "test");
+
+    cmd.args(&[
+        "--ignore-file", ".not-an-ignore1",
+        "--ignore-file", ".not-an-ignore2",
+        "test",
+    ]);
+    eqnice!("imp.log:test\n", cmd.stdout());
+});
+
+// See: https://github.com/BurntSushi/ripgrep/issues/68
+rgtest!(f68_no_ignore_vcs, |dir: Dir, mut cmd: TestCommand| {
+    dir.create_dir(".git");
+    dir.create(".gitignore", "foo");
+    dir.create(".ignore", "bar");
+    dir.create("foo", "test");
+    dir.create("bar", "test");
+
+    eqnice!("foo:test\n", cmd.arg("--no-ignore-vcs").arg("test").stdout());
+});
+
+// See: https://github.com/BurntSushi/ripgrep/issues/70
+rgtest!(f70_smart_case, |dir: Dir, mut cmd: TestCommand| {
+    dir.create("sherlock", SHERLOCK);
+
+    let expected = "\
+sherlock:For the Doctor Watsons of this world, as opposed to the Sherlock
+sherlock:be, to a very large extent, the result of luck. Sherlock Holmes
+";
+    eqnice!(expected, cmd.arg("-S").arg("sherlock").stdout());
+});
+
+// See: https://github.com/BurntSushi/ripgrep/issues/89
+rgtest!(f89_files_with_matches, |dir: Dir, mut cmd: TestCommand| {
+    dir.create("sherlock", SHERLOCK);
+
+    cmd.arg("--null").arg("--files-with-matches").arg("Sherlock");
+    eqnice!("sherlock\x00", cmd.stdout());
+});
+
+// See: https://github.com/BurntSushi/ripgrep/issues/89
+rgtest!(f89_files_without_match, |dir: Dir, mut cmd: TestCommand| {
+    dir.create("sherlock", SHERLOCK);
+    dir.create("file.py", "foo");
+
+    cmd.arg("--null").arg("--files-without-match").arg("Sherlock");
+    eqnice!("file.py\x00", cmd.stdout());
+});
+
+// See: https://github.com/BurntSushi/ripgrep/issues/89
+rgtest!(f89_count, |dir: Dir, mut cmd: TestCommand| {
+    dir.create("sherlock", SHERLOCK);
+
+    cmd.arg("--null").arg("--count").arg("Sherlock");
+    eqnice!("sherlock\x002\n", cmd.stdout());
+});
+
+// See: https://github.com/BurntSushi/ripgrep/issues/89
+rgtest!(f89_files, |dir: Dir, mut cmd: TestCommand| {
+    dir.create("sherlock", SHERLOCK);
+
+    eqnice!("sherlock\x00", cmd.arg("--null").arg("--files").stdout());
+});
+
+// See: https://github.com/BurntSushi/ripgrep/issues/89
+rgtest!(f89_match, |dir: Dir, mut cmd: TestCommand| {
+    dir.create("sherlock", SHERLOCK);
+
+    let expected = "\
+sherlock\x00For the Doctor Watsons of this world, as opposed to the Sherlock
+sherlock\x00Holmeses, success in the province of detective work must always
+sherlock\x00be, to a very large extent, the result of luck. Sherlock Holmes
+sherlock\x00can extract a clew from a wisp of straw or a flake of cigar ash;
+";
+    eqnice!(expected, cmd.arg("--null").arg("-C1").arg("Sherlock").stdout());
+});
+
+// See: https://github.com/BurntSushi/ripgrep/issues/109
+rgtest!(f109_max_depth, |dir: Dir, mut cmd: TestCommand| {
+    dir.create_dir("one");
+    dir.create("one/pass", "far");
+    dir.create_dir("one/too");
+    dir.create("one/too/many", "far");
+
+    cmd.arg("--maxdepth").arg("2").arg("far");
+    eqnice!("one/pass:far\n", cmd.stdout());
+});
+
+// See: https://github.com/BurntSushi/ripgrep/issues/124
+rgtest!(f109_case_sensitive_part1, |dir: Dir, mut cmd: TestCommand| {
+    dir.create("foo", "tEsT");
+
+    cmd.arg("--smart-case").arg("--case-sensitive").arg("test").assert_err();
+});
+
+// See: https://github.com/BurntSushi/ripgrep/issues/124
+rgtest!(f109_case_sensitive_part2, |dir: Dir, mut cmd: TestCommand| {
+    dir.create("foo", "tEsT");
+    cmd.arg("--ignore-case").arg("--case-sensitive").arg("test").assert_err();
+});
+
+// See: https://github.com/BurntSushi/ripgrep/issues/129
+rgtest!(f129_matches, |dir: Dir, mut cmd: TestCommand| {
+    dir.create("foo", "test\ntest abcdefghijklmnopqrstuvwxyz test");
+
+    let expected = "foo:test\nfoo:[Omitted long matching line]\n";
+    eqnice!(expected, cmd.arg("-M26").arg("test").stdout());
+});
+
+// See: https://github.com/BurntSushi/ripgrep/issues/129
+rgtest!(f129_context, |dir: Dir, mut cmd: TestCommand| {
+    dir.create("foo", "test\nabcdefghijklmnopqrstuvwxyz");
+
+    let expected = "foo:test\nfoo-[Omitted long context line]\n";
+    eqnice!(expected, cmd.arg("-M20").arg("-C1").arg("test").stdout());
+});
+
+// See: https://github.com/BurntSushi/ripgrep/issues/129
+rgtest!(f129_replace, |dir: Dir, mut cmd: TestCommand| {
+    dir.create("foo", "test\ntest abcdefghijklmnopqrstuvwxyz test");
+
+    let expected = "foo:foo\nfoo:[Omitted long line with 2 matches]\n";
+    eqnice!(expected, cmd.arg("-M26").arg("-rfoo").arg("test").stdout());
+});
+
+// See: https://github.com/BurntSushi/ripgrep/issues/159
+rgtest!(f159_max_count, |dir: Dir, mut cmd: TestCommand| {
+    dir.create("foo", "test\ntest");
+
+    eqnice!("foo:test\n", cmd.arg("-m1").arg("test").stdout());
+});
+
+// See: https://github.com/BurntSushi/ripgrep/issues/159
+rgtest!(f159_max_count_zero, |dir: Dir, mut cmd: TestCommand| {
+    dir.create("foo", "test\ntest");
+
+    cmd.arg("-m0").arg("test").assert_err();
+});
+
+// See: https://github.com/BurntSushi/ripgrep/issues/196
+rgtest!(f196_persistent_config, |dir: Dir, mut cmd: TestCommand| {
+    dir.create("sherlock", SHERLOCK);
+    cmd.arg("sherlock").arg("sherlock");
+
+    // Make sure we get no matches by default.
+    cmd.assert_err();
+
+    // Now add our config file, and make sure it impacts ripgrep.
+    dir.create(".ripgreprc", "--ignore-case");
+    cmd.cmd().env("RIPGREP_CONFIG_PATH", ".ripgreprc");
+
+    let expected = "\
+For the Doctor Watsons of this world, as opposed to the Sherlock
+be, to a very large extent, the result of luck. Sherlock Holmes
+";
+    eqnice!(expected, cmd.stdout());
+});
+
+// See: https://github.com/BurntSushi/ripgrep/issues/243
+rgtest!(f243_column_line, |dir: Dir, mut cmd: TestCommand| {
+    dir.create("foo", "test");
+
+    eqnice!("foo:1:1:test\n", cmd.arg("--column").arg("test").stdout());
+});
+
+// See: https://github.com/BurntSushi/ripgrep/issues/263
+rgtest!(f263_sort_files, |dir: Dir, mut cmd: TestCommand| {
+    dir.create("foo", "test");
+    dir.create("abc", "test");
+    dir.create("zoo", "test");
+    dir.create("bar", "test");
+
+    let expected = "abc:test\nbar:test\nfoo:test\nzoo:test\n";
+    eqnice!(expected, cmd.arg("--sort-files").arg("test").stdout());
+});
+
+// See: https://github.com/BurntSushi/ripgrep/issues/275
+rgtest!(f275_pathsep, |dir: Dir, mut cmd: TestCommand| {
+    dir.create_dir("foo");
+    dir.create("foo/bar", "test");
+
+    cmd.arg("test").arg("--path-separator").arg("Z");
+    eqnice!("fooZbar:test\n", cmd.stdout());
+});
+
+// See: https://github.com/BurntSushi/ripgrep/issues/362
+rgtest!(f362_dfa_size_limit, |dir: Dir, mut cmd: TestCommand| {
+    dir.create("sherlock", SHERLOCK);
+
+    // This should fall back to the nfa engine but should still produce the
+    // expected result.
+    cmd.arg("--dfa-size-limit").arg("10").arg(r"For\s").arg("sherlock");
+
+    let expected = "\
+For the Doctor Watsons of this world, as opposed to the Sherlock
+";
+    eqnice!(expected, cmd.stdout());
+});
+
+// See: https://github.com/BurntSushi/ripgrep/issues/362
+rgtest!(f362_exceeds_regex_size_limit, |dir: Dir, mut cmd: TestCommand| {
+    // --regex-size-limit doesn't apply to PCRE2.
+    if dir.is_pcre2() {
+        return;
+    }
+    cmd.arg("--regex-size-limit").arg("10K").arg(r"[0-9]\w+").assert_err();
+});
+
+// See: https://github.com/BurntSushi/ripgrep/issues/362
+#[cfg(target_pointer_width = "32")]
+rgtest!(f362_u64_to_narrow_usize_overflow, |dir: Dir, mut cmd: TestCommand| {
+    // --dfa-size-limit doesn't apply to PCRE2.
+    if dir.is_pcre2() {
+        return;
+    }
+    dir.create_size("foo", 1000000);
+
+    // 2^35 * 2^20 is ok for u64, but not for usize
+    cmd.arg("--dfa-size-limit").arg("34359738368M").arg("--files");
+    cmd.assert_err();
+});
+
+// See: https://github.com/BurntSushi/ripgrep/issues/411
+rgtest!(f411_single_threaded_search_stats, |dir: Dir, mut cmd: TestCommand| {
+    dir.create("sherlock", SHERLOCK);
+
+    let lines = cmd.arg("--stats").arg("Sherlock").stdout();
+    assert!(lines.contains("2 matched lines"));
+    assert!(lines.contains("1 files contained matches"));
+    assert!(lines.contains("1 files searched"));
+    assert!(lines.contains("seconds"));
+});
+
+rgtest!(f411_parallel_search_stats, |dir: Dir, mut cmd: TestCommand| {
+    dir.create("sherlock_1", SHERLOCK);
+    dir.create("sherlock_2", SHERLOCK);
+
+    let lines = cmd.arg("--stats").arg("Sherlock").stdout();
+    assert!(lines.contains("4 matched lines"));
+    assert!(lines.contains("2 files contained matches"));
+    assert!(lines.contains("2 files searched"));
+    assert!(lines.contains("seconds"));
+});
+
+// See: https://github.com/BurntSushi/ripgrep/issues/416
+rgtest!(f416_crlf, |dir: Dir, mut cmd: TestCommand| {
+    dir.create("sherlock", SHERLOCK_CRLF);
+    cmd.arg("--crlf").arg(r"Sherlock$").arg("sherlock");
+
+    let expected = "\
+For the Doctor Watsons of this world, as opposed to the Sherlock\r
+";
+    eqnice!(expected, cmd.stdout());
+});
+
+// See: https://github.com/BurntSushi/ripgrep/issues/416
+rgtest!(f416_crlf_multiline, |dir: Dir, mut cmd: TestCommand| {
+    dir.create("sherlock", SHERLOCK_CRLF);
+    cmd.arg("--crlf").arg("-U").arg(r"Sherlock$").arg("sherlock");
+
+    let expected = "\
+For the Doctor Watsons of this world, as opposed to the Sherlock\r
+";
+    eqnice!(expected, cmd.stdout());
+});
+
+// See: https://github.com/BurntSushi/ripgrep/issues/416
+rgtest!(f416_crlf_only_matching, |dir: Dir, mut cmd: TestCommand| {
+    dir.create("sherlock", SHERLOCK_CRLF);
+    cmd.arg("--crlf").arg("-o").arg(r"Sherlock$").arg("sherlock");
+
+    let expected = "\
+Sherlock\r
+";
+    eqnice!(expected, cmd.stdout());
+});
+
+// See: https://github.com/BurntSushi/ripgrep/issues/419
+rgtest!(f419_zero_as_shortcut_for_null, |dir: Dir, mut cmd: TestCommand| {
+    dir.create("sherlock", SHERLOCK);
+
+    cmd.arg("-0").arg("--count").arg("Sherlock");
+    eqnice!("sherlock\x002\n", cmd.stdout());
+});
+
+rgtest!(f740_passthru, |dir: Dir, mut cmd: TestCommand| {
+    dir.create("file", "\nfoo\nbar\nfoobar\n\nbaz\n");
+    dir.create("patterns", "foo\nbar\n");
+
+    // We can't assume that the way colour specs are translated to ANSI
+    // sequences will remain stable, and --replace doesn't currently work with
+    // pass-through, so for now we don't actually test the match sub-strings
+    let common_args = &["-n", "--passthru"];
+    let foo_expected = "\
+1-
+2:foo
+3-bar
+4:foobar
+5-
+6-baz
+";
+
+    // With single pattern
+    cmd.args(common_args).arg("foo").arg("file");
+    eqnice!(foo_expected, cmd.stdout());
+
+    let foo_bar_expected = "\
+1-
+2:foo
+3:bar
+4:foobar
+5-
+6-baz
+";
+
+    // With multiple -e patterns
+    let mut cmd = dir.command();
+    cmd.args(common_args);
+    cmd.args(&["-e", "foo", "-e", "bar", "file"]);
+    eqnice!(foo_bar_expected, cmd.stdout());
+
+    // With multiple -f patterns
+    let mut cmd = dir.command();
+    cmd.args(common_args);
+    cmd.args(&["-f", "patterns", "file"]);
+    eqnice!(foo_bar_expected, cmd.stdout());
+
+    // -c should override
+    let mut cmd = dir.command();
+    cmd.args(common_args);
+    cmd.args(&["-c", "foo", "file"]);
+    eqnice!("2\n", cmd.stdout());
+
+    let only_foo_expected = "\
+1-
+2:foo
+3-bar
+4:foo
+5-
+6-baz
+";
+
+    // -o should work
+    let mut cmd = dir.command();
+    cmd.args(common_args);
+    cmd.args(&["-o", "foo", "file"]);
+    eqnice!(only_foo_expected, cmd.stdout());
+
+    let replace_foo_expected = "\
+1-
+2:wat
+3-bar
+4:watbar
+5-
+6-baz
+";
+
+    // -r should work
+    let mut cmd = dir.command();
+    cmd.args(common_args);
+    cmd.args(&["-r", "wat", "foo", "file"]);
+    eqnice!(replace_foo_expected, cmd.stdout());
+});
+
+// See: https://github.com/BurntSushi/ripgrep/issues/948
+rgtest!(f948_exit_code_match, |dir: Dir, mut cmd: TestCommand| {
+    dir.create("sherlock", SHERLOCK);
+    cmd.arg(".");
+
+    cmd.assert_exit_code(0);
+});
+
+// See: https://github.com/BurntSushi/ripgrep/issues/948
+rgtest!(f948_exit_code_no_match, |dir: Dir, mut cmd: TestCommand| {
+    dir.create("sherlock", SHERLOCK);
+    cmd.arg("NADA");
+
+    cmd.assert_exit_code(1);
+});
+
+// See: https://github.com/BurntSushi/ripgrep/issues/948
+rgtest!(f948_exit_code_error, |dir: Dir, mut cmd: TestCommand| {
+    dir.create("sherlock", SHERLOCK);
+    cmd.arg("*");
+
+    cmd.assert_exit_code(2);
+});
+
+// See: https://github.com/BurntSushi/ripgrep/issues/917
+rgtest!(f917_trim, |dir: Dir, mut cmd: TestCommand| {
+const SHERLOCK: &'static str = "\
+zzz
+    For the Doctor Watsons of this world, as opposed to the Sherlock
+  Holmeses, success in the province of detective work must always
+\tbe, to a very large extent, the result of luck. Sherlock Holmes
+     can extract a clew from a wisp of straw or a flake of cigar ash;
+but Doctor Watson has to have it taken out for him and dusted,
+ and exhibited clearly, with a label attached.
+";
+    dir.create("sherlock", SHERLOCK);
+    cmd.args(&[
+        "-n", "-B1", "-A2", "--trim", "Holmeses", "sherlock",
+    ]);
+
+    let expected = "\
+2-For the Doctor Watsons of this world, as opposed to the Sherlock
+3:Holmeses, success in the province of detective work must always
+4-be, to a very large extent, the result of luck. Sherlock Holmes
+5-can extract a clew from a wisp of straw or a flake of cigar ash;
+";
+    eqnice!(expected, cmd.stdout());
+});
+
+// See: https://github.com/BurntSushi/ripgrep/issues/917
+//
+// This is like f917_trim, except this tests that trimming occurs even when the
+// whitespace is part of a match.
+rgtest!(f917_trim_match, |dir: Dir, mut cmd: TestCommand| {
+const SHERLOCK: &'static str = "\
+zzz
+    For the Doctor Watsons of this world, as opposed to the Sherlock
+  Holmeses, success in the province of detective work must always
+\tbe, to a very large extent, the result of luck. Sherlock Holmes
+     can extract a clew from a wisp of straw or a flake of cigar ash;
+but Doctor Watson has to have it taken out for him and dusted,
+ and exhibited clearly, with a label attached.
+";
+    dir.create("sherlock", SHERLOCK);
+    cmd.args(&[
+        "-n", "-B1", "-A2", "--trim", r"\s+Holmeses", "sherlock",
+    ]);
+
+    let expected = "\
+2-For the Doctor Watsons of this world, as opposed to the Sherlock
+3:Holmeses, success in the province of detective work must always
+4-be, to a very large extent, the result of luck. Sherlock Holmes
+5-can extract a clew from a wisp of straw or a flake of cigar ash;
+";
+    eqnice!(expected, cmd.stdout());
+});
+
+// See: https://github.com/BurntSushi/ripgrep/issues/993
+rgtest!(f993_null_data, |dir: Dir, mut cmd: TestCommand| {
+    dir.create("test", "foo\x00bar\x00\x00\x00baz\x00");
+    cmd.arg("--null-data").arg(r".+").arg("test");
+
+    // If we just used -a instead of --null-data, then the result would include
+    // all NUL bytes.
+    let expected = "foo\x00bar\x00baz\x00";
+    eqnice!(expected, cmd.stdout());
+});
diff --git a/tests/hay.rs b/tests/hay.rs
index 74d2f6cc..15a53b15 100644
--- a/tests/hay.rs
+++ b/tests/hay.rs
@@ -7,18 +7,11 @@ but Doctor Watson has to have it taken out for him and dusted,
 and exhibited clearly, with a label attached.
 ";
 
-pub const CODE: &'static str = "\
-extern crate snap;
-
-use std::io;
-
-fn main() {
-    let stdin = io::stdin();
-    let stdout = io::stdout();
-
-    // Wrap the stdin reader in a Snappy reader.
-    let mut rdr = snap::Reader::new(stdin.lock());
-    let mut wtr = stdout.lock();
-    io::copy(&mut rdr, &mut wtr).expect(\"I/O operation failed\");
-}
+pub const SHERLOCK_CRLF: &'static str = "\
+For the Doctor Watsons of this world, as opposed to the Sherlock\r
+Holmeses, success in the province of detective work must always\r
+be, to a very large extent, the result of luck. Sherlock Holmes\r
+can extract a clew from a wisp of straw or a flake of cigar ash;\r
+but Doctor Watson has to have it taken out for him and dusted,\r
+and exhibited clearly, with a label attached.\r
 ";
diff --git a/tests/json.rs b/tests/json.rs
new file mode 100644
index 00000000..4433103d
--- /dev/null
+++ b/tests/json.rs
@@ -0,0 +1,263 @@
+use std::time;
+
+use serde_json as json;
+
+use hay::{SHERLOCK, SHERLOCK_CRLF};
+use util::{Dir, TestCommand};
+
+#[derive(Clone, Debug, Deserialize, PartialEq, Eq)]
+#[serde(tag = "type", content = "data")]
+#[serde(rename_all = "snake_case")]
+enum Message {
+    Begin(Begin),
+    End(End),
+    Match(Match),
+    Context(Context),
+    Summary(Summary),
+}
+
+impl Message {
+    fn unwrap_begin(&self) -> Begin {
+        match *self {
+            Message::Begin(ref x) => x.clone(),
+            ref x => panic!("expected Message::Begin but got {:?}", x),
+        }
+    }
+
+    fn unwrap_end(&self) -> End {
+        match *self {
+            Message::End(ref x) => x.clone(),
+            ref x => panic!("expected Message::End but got {:?}", x),
+        }
+    }
+
+    fn unwrap_match(&self) -> Match {
+        match *self {
+            Message::Match(ref x) => x.clone(),
+            ref x => panic!("expected Message::Match but got {:?}", x),
+        }
+    }
+
+    fn unwrap_context(&self) -> Context {
+        match *self {
+            Message::Context(ref x) => x.clone(),
+            ref x => panic!("expected Message::Context but got {:?}", x),
+        }
+    }
+
+    fn unwrap_summary(&self) -> Summary {
+        match *self {
+            Message::Summary(ref x) => x.clone(),
+            ref x => panic!("expected Message::Summary but got {:?}", x),
+        }
+    }
+}
+
+#[derive(Clone, Debug, Deserialize, PartialEq, Eq)]
+struct Begin {
+    path: Option<Data>,
+}
+
+#[derive(Clone, Debug, Deserialize, PartialEq, Eq)]
+struct End {
+    path: Option<Data>,
+    binary_offset: Option<u64>,
+    stats: Stats,
+}
+
+#[derive(Clone, Debug, Deserialize, PartialEq, Eq)]
+struct Summary {
+    elapsed_total: Duration,
+    stats: Stats,
+}
+
+#[derive(Clone, Debug, Deserialize, PartialEq, Eq)]
+struct Match {
+    path: Option<Data>,
+    lines: Data,
+    line_number: Option<u64>,
+    absolute_offset: u64,
+    submatches: Vec<SubMatch>,
+}
+
+#[derive(Clone, Debug, Deserialize, PartialEq, Eq)]
+struct Context {
+    path: Option<Data>,
+    lines: Data,
+    line_number: Option<u64>,
+    absolute_offset: u64,
+    submatches: Vec<SubMatch>,
+}
+
+#[derive(Clone, Debug, Deserialize, PartialEq, Eq)]
+struct SubMatch {
+    #[serde(rename = "match")]
+    m: Data,
+    start: usize,
+    end: usize,
+}
+
+#[derive(Clone, Debug, Deserialize, PartialEq, Eq)]
+#[serde(untagged)]
+enum Data {
+    Text { text: String },
+    // This variant is used when the data isn't valid UTF-8. The bytes are
+    // base64 encoded, so using a String here is OK.
+    Bytes { bytes: String },
+}
+
+impl Data {
+    fn text(s: &str) -> Data { Data::Text { text: s.to_string() } }
+    fn bytes(s: &str) -> Data { Data::Bytes { bytes: s.to_string() } }
+}
+
+#[derive(Clone, Debug, Deserialize, PartialEq, Eq)]
+struct Stats {
+    elapsed: Duration,
+    searches: u64,
+    searches_with_match: u64,
+    bytes_searched: u64,
+    bytes_printed: u64,
+    matched_lines: u64,
+    matches: u64,
+}
+
+#[derive(Clone, Debug, Deserialize, PartialEq, Eq)]
+struct Duration {
+    #[serde(flatten)]
+    duration: time::Duration,
+    human: String,
+}
+
+/// Decode JSON Lines into a Vec<Message>. If there was an error decoding,
+/// this function panics.
+fn json_decode(jsonlines: &str) -> Vec<Message> {
+    json::Deserializer::from_str(jsonlines)
+        .into_iter()
+        .collect::<Result<Vec<Message>, _>>()
+        .unwrap()
+}
+
+rgtest!(basic, |dir: Dir, mut cmd: TestCommand| {
+    dir.create("sherlock", SHERLOCK);
+    cmd.arg("--json").arg("-B1").arg("Sherlock Holmes").arg("sherlock");
+
+    let msgs = json_decode(&cmd.stdout());
+
+    assert_eq!(
+        msgs[0].unwrap_begin(),
+        Begin { path: Some(Data::text("sherlock")) }
+    );
+    assert_eq!(
+        msgs[1].unwrap_context(),
+        Context {
+            path: Some(Data::text("sherlock")),
+            lines: Data::text("Holmeses, success in the province of detective work must always\n"),
+            line_number: Some(2),
+            absolute_offset: 65,
+            submatches: vec![],
+        }
+    );
+    assert_eq!(
+        msgs[2].unwrap_match(),
+        Match {
+            path: Some(Data::text("sherlock")),
+            lines: Data::text("be, to a very large extent, the result of luck. Sherlock Holmes\n"),
+            line_number: Some(3),
+            absolute_offset: 129,
+            submatches: vec![
+                SubMatch {
+                    m: Data::text("Sherlock Holmes"),
+                    start: 48,
+                    end: 63,
+                },
+            ],
+        }
+    );
+    assert_eq!(
+        msgs[3].unwrap_end().path,
+        Some(Data::text("sherlock"))
+    );
+    assert_eq!(
+        msgs[3].unwrap_end().binary_offset,
+        None
+    );
+    assert_eq!(
+        msgs[4].unwrap_summary().stats.searches_with_match,
+        1
+    );
+    assert_eq!(
+        msgs[4].unwrap_summary().stats.bytes_printed,
+        494
+    );
+});
+
+#[cfg(unix)]
+rgtest!(notutf8, |dir: Dir, mut cmd: TestCommand| {
+    use std::ffi::OsStr;
+    use std::os::unix::ffi::OsStrExt;
+
+    // This test does not work with PCRE2 because PCRE2 does not support the
+    // `u` flag.
+    if dir.is_pcre2() {
+        return;
+    }
+    // macOS doesn't like this either... sigh.
+    if cfg!(target_os = "macos") {
+        return;
+    }
+
+    let name = &b"foo\xFFbar"[..];
+    let contents = &b"quux\xFFbaz"[..];
+
+    // APFS does not support creating files with invalid UTF-8 bytes, so just
+    // skip the test if we can't create our file.
+    if !dir.try_create_bytes(OsStr::from_bytes(name), contents).is_ok() {
+        return;
+    }
+    cmd.arg("--json").arg(r"(?-u)\xFF");
+
+    let msgs = json_decode(&cmd.stdout());
+
+    assert_eq!(
+        msgs[0].unwrap_begin(),
+        Begin { path: Some(Data::bytes("Zm9v/2Jhcg==")) }
+    );
+    assert_eq!(
+        msgs[1].unwrap_match(),
+        Match {
+            path: Some(Data::bytes("Zm9v/2Jhcg==")),
+            lines: Data::bytes("cXV1eP9iYXo="),
+            line_number: Some(1),
+            absolute_offset: 0,
+            submatches: vec![
+                SubMatch {
+                    m: Data::bytes("/w=="),
+                    start: 4,
+                    end: 5,
+                },
+            ],
+        }
+    );
+});
+
+// See: https://github.com/BurntSushi/ripgrep/issues/416
+//
+// This test in particular checks that our match does _not_ include the `\r`
+// even though the '$' may be rewritten as '(?:\r??$)' and could thus include
+// `\r` in the match.
+rgtest!(crlf, |dir: Dir, mut cmd: TestCommand| {
+    dir.create("sherlock", SHERLOCK_CRLF);
+    cmd.arg("--json").arg("--crlf").arg(r"Sherlock$").arg("sherlock");
+
+    let msgs = json_decode(&cmd.stdout());
+
+    assert_eq!(
+        msgs[1].unwrap_match().submatches[0].clone(),
+        SubMatch {
+            m: Data::text("Sherlock"),
+            start: 56,
+            end: 64,
+        },
+    );
+});
diff --git a/tests/macros.rs b/tests/macros.rs
new file mode 100644
index 00000000..24bf13f8
--- /dev/null
+++ b/tests/macros.rs
@@ -0,0 +1,61 @@
+#[macro_export]
+macro_rules! rgtest {
+    ($name:ident, $fun:expr) => {
+        #[test]
+        fn $name() {
+            let (dir, cmd) = ::util::setup(stringify!($name));
+            $fun(dir, cmd);
+
+            if cfg!(feature = "pcre2") {
+                let (dir, cmd) = ::util::setup_pcre2(stringify!($name));
+                $fun(dir, cmd);
+            }
+        }
+    }
+}
+
+#[macro_export]
author	Andrew Gallant <jamslam@gmail.com>	2018-08-06 20:11:58 -0400
committer	Andrew Gallant <jamslam@gmail.com>	2018-08-20 07:10:19 -0400
commit	eb184d7711a3d01b2fd3a4281b193f39f7e9a2c5 (patch)
tree	6531c55af7eae5670d224d347763ad1e3216e8b4
parent	bb110c1ebeeda452046830b3991f705f5759da92 (diff)