D12392: merge-lists: make it possible to specify pattern to match

martinvonz (Martin von Zweigbergk) phabricator at mercurial-scm.org
Tue Mar 22 04:58:52 UTC 2022


martinvonz created this revision.
Herald added a reviewer: hg-reviewers.
Herald added a subscriber: mercurial-patches.

REVISION SUMMARY
  The `merge-lists` tool doesn't know anything about Python other than
  its regex that attempts to match import lines. Let's make it possible
  to pass in a custom regex so it's easy to use the tool for e.g. C/C++
  `#include` lines or Rust `use` lines (given the limited).

REPOSITORY
  rHG Mercurial

BRANCH
  default

REVISION DETAIL
  https://phab.mercurial-scm.org/D12392

AFFECTED FILES
  contrib/merge-lists/src/main.rs
  contrib/merge-lists/tests/test-merge-lists.rs

CHANGE DETAILS

diff --git a/contrib/merge-lists/tests/test-merge-lists.rs b/contrib/merge-lists/tests/test-merge-lists.rs
--- a/contrib/merge-lists/tests/test-merge-lists.rs
+++ b/contrib/merge-lists/tests/test-merge-lists.rs
@@ -1,7 +1,8 @@
 use similar::DiffableStr;
+use std::ffi::OsStr;
 use tempdir::TempDir;
 
-fn run_test(input: &str) -> String {
+fn run_test(arg: &str, input: &str) -> String {
     let mut cmd = assert_cmd::Command::cargo_bin("merge-lists").unwrap();
     let temp_dir = TempDir::new("test").unwrap();
     let base_path = temp_dir.path().join("base");
@@ -16,6 +17,7 @@
     std::fs::write(&local_path, split.next().unwrap()).unwrap();
     std::fs::write(&other_path, split.next().unwrap()).unwrap();
     cmd.args(&[
+        OsStr::new(arg),
         local_path.as_os_str(),
         base_path.as_os_str(),
         other_path.as_os_str(),
@@ -38,6 +40,7 @@
 #[test]
 fn test_merge_lists_basic() {
     let output = run_test(
+        "--python-imports",
         r"
 base:
 import lib1
@@ -72,6 +75,7 @@
     // Test some "from x import y" statements and some non-import conflicts
     // (unresolvable)
     let output = run_test(
+        "--python-imports",
         r"
 base:
 from . import x
@@ -116,6 +120,7 @@
     // Test that nothing is done if the elements in the conflicting hunks are
     // not sorted
     let output = run_test(
+        "--python-imports",
         r"
 base:
 import x
@@ -154,3 +159,46 @@
     3+3
     "###);
 }
+
+#[test]
+fn test_custom_regex() {
+    // Test merging of all lines (by matching anything)
+    let output = run_test(
+        "--pattern=.*",
+        r"
+base:
+aardvark
+baboon
+camel
+
+local:
+aardvark
+camel
+eagle
+
+other:
+aardvark
+camel
+deer
+",
+    );
+    insta::assert_snapshot!(output, @r###"
+    base:
+    aardvark
+    camel
+    deer
+    eagle
+
+    local:
+    aardvark
+    camel
+    deer
+    eagle
+
+    other:
+    aardvark
+    camel
+    deer
+    eagle
+    "###);
+}
diff --git a/contrib/merge-lists/src/main.rs b/contrib/merge-lists/src/main.rs
--- a/contrib/merge-lists/src/main.rs
+++ b/contrib/merge-lists/src/main.rs
@@ -1,3 +1,4 @@
+use clap::ArgMatches;
 use itertools::Itertools;
 use regex::bytes::Regex;
 use similar::ChangeTag;
@@ -143,11 +144,34 @@
     (new_base_bytes, new_local_bytes, new_other_bytes)
 }
 
+fn get_regex(matches: &ArgMatches) -> Regex {
+    let pattern = if matches.is_present("python") {
+        r"import \w+(\.\w+)*( +#.*)?\n|from (\w+(\.\w+)* import \w+( as \w+)?(, \w+( as \w+)?)*( +#.*)?)"
+    } else if let Some(pattern) = matches.value_of("pattern") {
+        pattern
+    } else {
+        ".*"
+    };
+    let pattern = format!(r"{}\r?\n?", pattern);
+    regex::bytes::Regex::new(&pattern).unwrap()
+}
+
 fn main() {
     let app = clap::Command::new("merge-lists")
         .arg(clap::Arg::new("local").index(1).required(true))
         .arg(clap::Arg::new("base").index(2).required(true))
-        .arg(clap::Arg::new("other").index(3).required(true));
+        .arg(clap::Arg::new("other").index(3).required(true))
+        .arg(
+            clap::Arg::new("pattern")
+                .long("pattern")
+                .short('p')
+                .takes_value(true),
+        )
+        .arg(
+            clap::Arg::new("python")
+                .long("python-imports")
+                .conflicts_with("pattern"),
+        );
     let matches = app.get_matches();
 
     let base_path = PathBuf::from(matches.value_of("base").unwrap());
@@ -158,8 +182,7 @@
     let local_bytes = std::fs::read(&local_path).unwrap();
     let other_bytes = std::fs::read(&other_path).unwrap();
 
-    let regex =
-        regex::bytes::Regex::new(r"import \w+(\.\w+)*( +#.*)?\n|from (\w+(\.\w+)* import \w+( as \w+)?(, \w+( as \w+)?)*( +#.*)?)\r?\n?").unwrap();
+    let regex = get_regex(&matches);
     let (new_base_bytes, new_local_bytes, new_other_bytes) =
         resolve(&base_bytes, &local_bytes, &other_bytes, &regex);
     // Write out the result if anything changed



To: martinvonz, #hg-reviewers
Cc: mercurial-patches, mercurial-devel


More information about the Mercurial-devel mailing list