[PATCH v2 0/2] [GSOC][RFC] ref-filter: introduce enum atom_type

"ZheNing Hu via GitGitGadget" <gitgitgadget@xxxxxxxxx> · Mon, 10 May 2021 15:03:17 +0000

Changes since the last version:

 * Remove the atom_type member from valid_atom, at the suggestion of
   Christian and Junio, and use the ATOM_* values as indices into
   valid_atom instead.
 * Add ATOM_INVALID and ATOM_UNKNOWN, at Christian's suggestion, so that
   we can iterate over valid_atom using them as loop bounds.
 * Add a comment above enum atom_type that explains its role to readers.

ZheNing Hu (2):
  [GSOC] ref-filter: add objectsize to used_atom
  [GSOC] ref-filter: introduce enum atom_type

 ref-filter.c | 231 ++++++++++++++++++++++++++++++++++-----------------
 1 file changed, 155 insertions(+), 76 deletions(-)

base-commit: 7e391989789db82983665667013a46eabc6fc570
Published-As: https://github.com/gitgitgadget/git/releases/tag/pr-951%2Fadlternative%2Fref-filter-atom-type-v2
Fetch-It-Via: git fetch https://github.com/gitgitgadget/git pr-951/adlternative/ref-filter-atom-type-v2
Pull-Request: https://github.com/gitgitgadget/git/pull/951

Range-diff vs v1:

 1:  91ca57c9d04a = 1:  91ca57c9d04a [GSOC] ref-filter: add objectsize to used_atom
 2:  3770df182983 ! 2:  a1f70b39b7ef [GSOC][RFC] ref-filter: introduce enum atom_type
     @@ Metadata
      Author: ZheNing Hu <adlternative@xxxxxxxxx>

       ## Commit message ##
     -    [GSOC][RFC] ref-filter: introduce enum atom_type
     +    [GSOC] ref-filter: introduce enum atom_type

          In the original ref-filter design, it will copy the parsed
          atom's name and attributes to `used_atom[i].name` in the
     @@ Commit message
          in the later specific ref attributes filling step. It uses
          a lot of string matching to determine which atom we need.

     -    Introduce the enum member `valid_atom.atom_type` which
     -    record type of each valid_atom, in the first step of the
     -    atom parsing, `used_atom.atom_type` will record corresponding
     -    enum value from `valid_atom.atom_type`, and then in specific
     -    reference attribute filling step, only need to compare the
     -    value of the `used_atom.atom_type` to judge the atom type.
     +    Introduce the enum "atom_type". Each enum value is named
     +    `ATOM_*` and is the index of the corresponding valid_atom
     +    entry. In the first step of atom parsing,
     +    `used_atom.atom_type` records the enum value, i.e. the
     +    index of the matching valid_atom entry; then, in the
     +    reference attribute filling step, we only need to compare
     +    the value of `used_atom.atom_type` to determine the atom type.

     -    At the same time, The value of an atom_type is the coordinate
     -    of its corresponding valid_atom entry, we can quickly index
     -    to the corresponding valid_atom entry by the atom_type value.
     +    The enum value of `ATOM_UNKNOWN` is equal to zero, which
     +    ensures that we can easily distinguish a struct whose
     +    atom_type is known from a struct whose atom_type is not
     +    yet known.
     +
     +    The enum value of `ATOM_INVALID` is equal to the size of
     +    the valid_atom array, which lets us iterate over the
     +    valid_atom array using something like:
     +
     +    for (i = ATOM_UNKNOWN + 1; i < ATOM_INVALID; i++)
     +            /* do something with valid_atom[i] */;

          Signed-off-by: ZheNing Hu <adlternative@xxxxxxxxx>

     @@ ref-filter.c: static struct ref_to_worktree_map {
       	struct worktree **worktrees;
       } ref_to_worktree_map;

     ++/*
     ++ * The enum atom_type is used as the index into the valid_atom array.
     ++ * In the atom parsing stage, it will be passed to used_atom.atom_type
     ++ * as the identifier of the atom type. We can check the type of a used_atom
     ++ * entry by `if (used_atom[i].atom_type == ATOM_*)`.
     ++ *
     ++ * ATOM_UNKNOWN equals 0 and is used as the enumeration value of an
     ++ * uninitialized atom_type.
     ++ * ATOM_INVALID equals the size of the valid_atom array, which lets us
     ++ * iterate over the valid_atom array like this:
     ++ *
     ++ * 	for (i = ATOM_UNKNOWN + 1; i < ATOM_INVALID; i++) {
     ++ *		int len = strlen(valid_atom[i].name);
     ++ *		if (len == atom_len && !memcmp(valid_atom[i].name, sp, len))
     ++ *			break;
     ++ *	}
     ++ */
      +enum atom_type {
     ++ATOM_UNKNOWN,
      +ATOM_REFNAME,
      +ATOM_OBJECTTYPE,
      +ATOM_OBJECTSIZE,
     @@ ref-filter.c: static struct ref_to_worktree_map {
      +ATOM_IF,
      +ATOM_THEN,
      +ATOM_ELSE,
     ++ATOM_INVALID,
      +};
      +
       /*
        * An atom is a valid field atom listed below, possibly prefixed with
        * a "*" to denote deref_tag().
     -@@ ref-filter.c: static struct used_atom {
     - 	const char *name;
     - 	cmp_type type;
     - 	info_source source;
     -+	enum atom_type atom_type;
     - 	union {
     - 		char color[COLOR_MAXLEN];
     - 		struct align align;
     -@@ ref-filter.c: static int head_atom_parser(const struct ref_format *format, struct used_atom *a
     - }
     - 
     - static struct {
     +@@ ref-filter.c: static struct ref_to_worktree_map {
     +  * array.
     +  */
     + static struct used_atom {
      +	enum atom_type atom_type;
       	const char *name;
     + 	cmp_type type;
       	info_source source;
     - 	cmp_type cmp_type;
     +@@ ref-filter.c: static struct {
       	int (*parser)(const struct ref_format *format, struct used_atom *atom,
       		      const char *arg, struct strbuf *err);
       } valid_atom[] = {
     @@ ref-filter.c: static int head_atom_parser(const struct ref_format *format, struc
      -	{ "if", SOURCE_NONE, FIELD_STR, if_atom_parser },
      -	{ "then", SOURCE_NONE },
      -	{ "else", SOURCE_NONE },
     -+	{ ATOM_REFNAME, "refname", SOURCE_NONE, FIELD_STR, refname_atom_parser },
     -+	{ ATOM_OBJECTTYPE, "objecttype", SOURCE_OTHER, FIELD_STR, objecttype_atom_parser },
     -+	{ ATOM_OBJECTSIZE, "objectsize", SOURCE_OTHER, FIELD_ULONG, objectsize_atom_parser },
     -+	{ ATOM_OBJECTNAME, "objectname", SOURCE_OTHER, FIELD_STR, oid_atom_parser },
     -+	{ ATOM_DELTABASE, "deltabase", SOURCE_OTHER, FIELD_STR, deltabase_atom_parser },
     -+	{ ATOM_TREE, "tree", SOURCE_OBJ, FIELD_STR, oid_atom_parser },
     -+	{ ATOM_PARENT, "parent", SOURCE_OBJ, FIELD_STR, oid_atom_parser },
     -+	{ ATOM_NUMPARENT, "numparent", SOURCE_OBJ, FIELD_ULONG },
     -+	{ ATOM_OBJECT, "object", SOURCE_OBJ },
     -+	{ ATOM_TYPE, "type", SOURCE_OBJ },
     -+	{ ATOM_TAG, "tag", SOURCE_OBJ },
     -+	{ ATOM_AUTHOR, "author", SOURCE_OBJ },
     -+	{ ATOM_AUTHORNAME, "authorname", SOURCE_OBJ },
     -+	{ ATOM_AUTHOREMAIL, "authoremail", SOURCE_OBJ, FIELD_STR, person_email_atom_parser },
     -+	{ ATOM_AUTHORDATE, "authordate", SOURCE_OBJ, FIELD_TIME },
     -+	{ ATOM_COMMITTER, "committer", SOURCE_OBJ },
     -+	{ ATOM_COMMITTERNAME, "committername", SOURCE_OBJ },
     -+	{ ATOM_COMMITTEREMAIL, "committeremail", SOURCE_OBJ, FIELD_STR, person_email_atom_parser },
     -+	{ ATOM_COMMITTERDATE, "committerdate", SOURCE_OBJ, FIELD_TIME },
     -+	{ ATOM_TAGGER, "tagger", SOURCE_OBJ },
     -+	{ ATOM_TAGGERNAME, "taggername", SOURCE_OBJ },
     -+	{ ATOM_TAGGEREMAIL, "taggeremail", SOURCE_OBJ, FIELD_STR, person_email_atom_parser },
     -+	{ ATOM_TAGGERDATE, "taggerdate", SOURCE_OBJ, FIELD_TIME },
     -+	{ ATOM_CREATOR, "creator", SOURCE_OBJ },
     -+	{ ATOM_CREATORDATE, "creatordate", SOURCE_OBJ, FIELD_TIME },
     -+	{ ATOM_SUBJECT, "subject", SOURCE_OBJ, FIELD_STR, subject_atom_parser },
     -+	{ ATOM_BODY, "body", SOURCE_OBJ, FIELD_STR, body_atom_parser },
     -+	{ ATOM_TRAILERS, "trailers", SOURCE_OBJ, FIELD_STR, trailers_atom_parser },
     -+	{ ATOM_CONTENTS, "contents", SOURCE_OBJ, FIELD_STR, contents_atom_parser },
     -+	{ ATOM_UPSTREAM, "upstream", SOURCE_NONE, FIELD_STR, remote_ref_atom_parser },
     -+	{ ATOM_PUSH, "push", SOURCE_NONE, FIELD_STR, remote_ref_atom_parser },
     -+	{ ATOM_SYMREF, "symref", SOURCE_NONE, FIELD_STR, refname_atom_parser },
     -+	{ ATOM_FLAG, "flag", SOURCE_NONE },
     -+	{ ATOM_HEAD, "HEAD", SOURCE_NONE, FIELD_STR, head_atom_parser },
     -+	{ ATOM_COLOR, "color", SOURCE_NONE, FIELD_STR, color_atom_parser },
     -+	{ ATOM_WORKTREEPATH, "worktreepath", SOURCE_NONE },
     -+	{ ATOM_ALIGN, "align", SOURCE_NONE, FIELD_STR, align_atom_parser },
     -+	{ ATOM_END, "end", SOURCE_NONE },
     -+	{ ATOM_IF, "if", SOURCE_NONE, FIELD_STR, if_atom_parser },
     -+	{ ATOM_THEN, "then", SOURCE_NONE },
     -+	{ ATOM_ELSE, "else", SOURCE_NONE },
     ++	[ATOM_REFNAME] = { "refname", SOURCE_NONE, FIELD_STR, refname_atom_parser },
     ++	[ATOM_OBJECTTYPE] = { "objecttype", SOURCE_OTHER, FIELD_STR, objecttype_atom_parser },
     ++	[ATOM_OBJECTSIZE] = { "objectsize", SOURCE_OTHER, FIELD_ULONG, objectsize_atom_parser },
     ++	[ATOM_OBJECTNAME] = { "objectname", SOURCE_OTHER, FIELD_STR, oid_atom_parser },
     ++	[ATOM_DELTABASE] = { "deltabase", SOURCE_OTHER, FIELD_STR, deltabase_atom_parser },
     ++	[ATOM_TREE] = { "tree", SOURCE_OBJ, FIELD_STR, oid_atom_parser },
     ++	[ATOM_PARENT] = { "parent", SOURCE_OBJ, FIELD_STR, oid_atom_parser },
     ++	[ATOM_NUMPARENT] = { "numparent", SOURCE_OBJ, FIELD_ULONG },
     ++	[ATOM_OBJECT] = { "object", SOURCE_OBJ },
     ++	[ATOM_TYPE] = { "type", SOURCE_OBJ },
     ++	[ATOM_TAG] = { "tag", SOURCE_OBJ },
     ++	[ATOM_AUTHOR] = { "author", SOURCE_OBJ },
     ++	[ATOM_AUTHORNAME] = { "authorname", SOURCE_OBJ },
     ++	[ATOM_AUTHOREMAIL] = { "authoremail", SOURCE_OBJ, FIELD_STR, person_email_atom_parser },
     ++	[ATOM_AUTHORDATE] = { "authordate", SOURCE_OBJ, FIELD_TIME },
     ++	[ATOM_COMMITTER] = { "committer", SOURCE_OBJ },
     ++	[ATOM_COMMITTERNAME] = { "committername", SOURCE_OBJ },
     ++	[ATOM_COMMITTEREMAIL] = { "committeremail", SOURCE_OBJ, FIELD_STR, person_email_atom_parser },
     ++	[ATOM_COMMITTERDATE] = { "committerdate", SOURCE_OBJ, FIELD_TIME },
     ++	[ATOM_TAGGER] = { "tagger", SOURCE_OBJ },
     ++	[ATOM_TAGGERNAME] = { "taggername", SOURCE_OBJ },
     ++	[ATOM_TAGGEREMAIL] = { "taggeremail", SOURCE_OBJ, FIELD_STR, person_email_atom_parser },
     ++	[ATOM_TAGGERDATE] = { "taggerdate", SOURCE_OBJ, FIELD_TIME },
     ++	[ATOM_CREATOR] = { "creator", SOURCE_OBJ },
     ++	[ATOM_CREATORDATE] = { "creatordate", SOURCE_OBJ, FIELD_TIME },
     ++	[ATOM_SUBJECT] = { "subject", SOURCE_OBJ, FIELD_STR, subject_atom_parser },
     ++	[ATOM_BODY] = { "body", SOURCE_OBJ, FIELD_STR, body_atom_parser },
     ++	[ATOM_TRAILERS] = { "trailers", SOURCE_OBJ, FIELD_STR, trailers_atom_parser },
     ++	[ATOM_CONTENTS] = { "contents", SOURCE_OBJ, FIELD_STR, contents_atom_parser },
     ++	[ATOM_UPSTREAM] = { "upstream", SOURCE_NONE, FIELD_STR, remote_ref_atom_parser },
     ++	[ATOM_PUSH] = { "push", SOURCE_NONE, FIELD_STR, remote_ref_atom_parser },
     ++	[ATOM_SYMREF] = { "symref", SOURCE_NONE, FIELD_STR, refname_atom_parser },
     ++	[ATOM_FLAG] = { "flag", SOURCE_NONE },
     ++	[ATOM_HEAD] = { "HEAD", SOURCE_NONE, FIELD_STR, head_atom_parser },
     ++	[ATOM_COLOR] = { "color", SOURCE_NONE, FIELD_STR, color_atom_parser },
     ++	[ATOM_WORKTREEPATH] = { "worktreepath", SOURCE_NONE },
     ++	[ATOM_ALIGN] = { "align", SOURCE_NONE, FIELD_STR, align_atom_parser },
     ++	[ATOM_END] = { "end", SOURCE_NONE },
     ++	[ATOM_IF] = { "if", SOURCE_NONE, FIELD_STR, if_atom_parser },
     ++	[ATOM_THEN] = { "then", SOURCE_NONE },
     ++	[ATOM_ELSE] = { "else", SOURCE_NONE },
       	/*
       	 * Please update $__git_ref_fieldlist in git-completion.bash
       	 * when you add new atoms
     +@@ ref-filter.c: static int parse_ref_filter_atom(const struct ref_format *format,
     + 	atom_len = (arg ? arg : ep) - sp;
     + 
     + 	/* Is the atom a valid one? */
     +-	for (i = 0; i < ARRAY_SIZE(valid_atom); i++) {
     ++	for (i = ATOM_UNKNOWN + 1; i < ATOM_INVALID; i++) {
     + 		int len = strlen(valid_atom[i].name);
     + 		if (len == atom_len && !memcmp(valid_atom[i].name, sp, len))
     + 			break;
     + 	}
     + 
     +-	if (ARRAY_SIZE(valid_atom) <= i)
     ++	if (i == ATOM_INVALID)
     + 		return strbuf_addf_ret(err, -1, _("unknown field name: %.*s"),
     + 				       (int)(ep-atom), atom);
     + 	if (valid_atom[i].source != SOURCE_NONE && !have_git_dir())
      @@ ref-filter.c: static int parse_ref_filter_atom(const struct ref_format *format,
       	at = used_atom_cnt;
       	used_atom_cnt++;
       	REALLOC_ARRAY(used_atom, used_atom_cnt);
     -+	used_atom[at].atom_type = valid_atom[i].atom_type;
     ++	used_atom[at].atom_type = i;
       	used_atom[at].name = xmemdupz(atom, ep - atom);
       	used_atom[at].type = valid_atom[i].cmp_type;
       	used_atom[at].source = valid_atom[i].source;
     @@ ref-filter.c: static int parse_ref_filter_atom(const struct ref_format *format,
       	if (*atom == '*')
       		need_tagged = 1;
      -	if (!strcmp(valid_atom[i].name, "symref"))
     -+	if (valid_atom[i].atom_type == ATOM_SYMREF)
     ++	if (i == ATOM_SYMREF)
       		need_symref = 1;
       	return at;
       }

-- 
gitgitgadget