|
|
|
#ifndef SUBMODULE_CONFIG_CACHE_H
|
|
|
|
#define SUBMODULE_CONFIG_CACHE_H
|
|
|
|
|
|
|
|
#include "cache.h"
|
|
|
|
#include "config.h"
|
|
|
|
#include "hashmap.h"
|
|
|
|
#include "submodule.h"
|
|
|
|
#include "strbuf.h"
|
|
|
|
|
|
|
|
/**
 * The submodule config cache API allows reading submodule
 * configurations/information from specified revisions. Internally,
 * information is lazily read into a cache that is used to avoid
 * unnecessary parsing of the same .gitmodules files. Lookups can be done by
 * submodule path or name.
 *
 * Usage
 * -----
 *
 * The caller can look up information about submodules by using the
 * `submodule_from_path()` or `submodule_from_name()` functions. They return
 * a pointer to a `struct submodule` which contains the values. The API
 * automatically initializes and allocates the needed infrastructure on
 * demand. If the caller only wants to look up values from revisions, the
 * initialization can be skipped.
 *
 * If the internal cache might grow too big or when the caller is done with
 * the API, all internally cached values can be freed with submodule_free().
 */
|
|
|
|
|
|
|
|
/*
|
|
|
|
* Submodule entry containing the information about a certain submodule
|
|
|
|
* in a certain revision. It is returned by the lookup functions.
|
|
|
|
*/
|
|
|
|
struct submodule {
|
|
|
|
const char *path;
|
|
|
|
const char *name;
|
|
|
|
const char *url;
|
|
|
|
int fetch_recurse;
|
|
|
|
const char *ignore;
|
|
|
|
const char *branch;
|
|
|
|
struct submodule_update_strategy update_strategy;
|
|
|
|
/* the object id of the responsible .gitmodules file */
|
|
|
|
struct object_id gitmodules_oid;
|
|
|
|
int recommend_shallow;
|
|
|
|
};
|
|
|
|
|
|
|
|
/*
 * Static initializer for `struct submodule`. The values are positional and
 * follow the member order of the struct.
 *
 * The expansion deliberately carries no trailing semicolon: the user supplies
 * it (`struct submodule s = SUBMODULE_INIT;`), which also lets the macro be
 * nested inside a larger initializer list such as an array initializer.
 */
#define SUBMODULE_INIT { NULL, NULL, NULL, RECURSE_SUBMODULES_NONE, \
	NULL, NULL, SUBMODULE_UPDATE_STRATEGY_INIT, { { 0 } }, -1 }
|
|
|
|
|
|
|
|
/* Opaque types: this header only ever refers to them through pointers. */
struct submodule_cache;
struct repository;

/*
 * NOTE(review): going by the name, this releases `cache`; what else it frees
 * is not visible in this header -- confirm against the definition.
 */
void submodule_cache_free(struct submodule_cache *cache);
|
|
|
|
|
|
|
|
/*
 * Helpers taking a configuration variable/value pair or a command-line
 * option/argument pair.
 * NOTE(review): going by the names, these parse the fetch-jobs setting and
 * the "recurse submodules" argument for fetch, update and push. The accepted
 * values and the meaning of the int results are not visible in this header --
 * confirm against the definitions before relying on them.
 */
int parse_submodule_fetchjobs(const char *var, const char *value);
int parse_fetch_recurse_submodules_arg(const char *opt, const char *arg);
struct option;
int option_fetch_parse_recurse_submodules(const struct option *opt,
					   const char *arg, int unset);
int parse_update_recurse_submodules_arg(const char *opt, const char *arg);
int parse_push_recurse_submodules_arg(const char *opt, const char *arg);
|
|
|
|
/*
 * NOTE(review): going by the names, these load .gitmodules configuration:
 * the first for `repo` (with `skip_if_read` presumably suppressing a repeated
 * read), the second for the commit identified by `commit_oid`. Confirm
 * against the definitions.
 */
void repo_read_gitmodules(struct repository *repo, int skip_if_read);
void gitmodules_config_oid(const struct object_id *commit_oid);
|
|
|
|
|
|
|
|
/**
 * Same as submodule_from_path(), but the submodule is looked up by its
 * `name` instead of by its path.
 */
const struct submodule *submodule_from_name(struct repository *r,
					    const struct object_id *commit_or_tree,
					    const char *name);
|
|
|
|
|
|
|
|
/**
 * Given a tree-ish in the superproject and a path, return the submodule that
 * is bound at the path in the named tree.
 *
 * `commit_or_tree` names the tree-ish and `path` the location to look up.
 * NOTE(review): `r` is presumably the superproject's repository, and the
 * result for a path with no submodule is not visible in this header --
 * confirm both against the definition.
 */
const struct submodule *submodule_from_path(struct repository *r,
					    const struct object_id *commit_or_tree,
					    const char *path);
|
|
|
|
|
|
|
|
/**
 * Use this to free the internally cached values.
 *
 * NOTE(review): presumably only the values cached for repository `r` are
 * released -- confirm against the definition.
 */
void submodule_free(struct repository *r);
|
|
|
|
|
|
|
|
/*
 * NOTE(review): going by the names, the first prints the value stored under
 * `key` in the .gitmodules of `repo`, and the second stores `value` under
 * `key` in the .gitmodules file, reporting failure through its return value
 * ("gently") rather than dying. Confirm against the definitions.
 */
int print_config_from_gitmodules(struct repository *repo, const char *key);
int config_set_in_gitmodules_file_gently(const char *key, const char *value);
|
|
|
|
|
/*
 * Commit message attached to the declaration below (from the blame view):
 *
 * submodule-config: verify submodule names as paths
 *
 * Submodule "names" come from the untrusted .gitmodules file,
 * but we blindly append them to $GIT_DIR/modules to create our
 * on-disk repo paths. This means you can do bad things by
 * putting "../" into the name (among other things).
 *
 * Let's sanity-check these names to avoid building a path that
 * can be exploited. There are two main decisions:
 *
 * 1. What should the allowed syntax be?
 *
 *    It's tempting to reuse verify_path(), since submodule
 *    names typically come from in-repo paths. But there are
 *    two reasons not to:
 *
 *    a. It's technically more strict than what we need, as
 *       we really care only about breaking out of the
 *       $GIT_DIR/modules/ hierarchy. E.g., having a
 *       submodule named "foo/.git" isn't actually
 *       dangerous, and it's possible that somebody has
 *       manually given such a funny name.
 *
 *    b. Since we'll eventually use this checking logic in
 *       fsck to prevent downstream repositories, it should
 *       be consistent across platforms. Because
 *       verify_path() relies on is_dir_sep(), it wouldn't
 *       block "foo\..\bar" on a non-Windows machine.
 *
 * 2. Where should we enforce it? These days most of the
 *    .gitmodules reads go through submodule-config.c, so
 *    I've put it there in the reading step. That should
 *    cover all of the C code.
 *
 *    We also construct the name for "git submodule add"
 *    inside the git-submodule.sh script. This is probably
 *    not a big deal for security since the name is coming
 *    from the user anyway, but it would be polite to remind
 *    them if the name they pick is invalid (and we need to
 *    expose the name-checker to the shell anyway for our
 *    test scripts).
 *
 *    This patch issues a warning when reading .gitmodules
 *    and just ignores the related config entry completely.
 *    This will generally end up producing a sensible error,
 *    as it works the same as a .gitmodules file which is
 *    missing a submodule entry (so "submodule update" will
 *    barf, but "git clone --recurse-submodules" will print
 *    an error but not abort the clone).
 *
 *    There is one minor oddity, which is that we print the
 *    warning once per malformed config key (since that's how
 *    the config subsystem gives us the entries). So in the
 *    new test, for example, the user would see three
 *    warnings. That's OK, since the intent is that this case
 *    should never come up outside of malicious repositories
 *    (and then it might even benefit the user to see the
 *    message multiple times).
 *
 * Credit for finding this vulnerability and the proof of
 * concept from which the test script was adapted goes to
 * Etienne Stalmans.
 *
 * Signed-off-by: Jeff King <peff@peff.net>
 * 7 years ago
 */
|
|
|
/*
 * Returns 0 if the name is syntactically acceptable as a submodule "name"
 * (e.g., that may be found in the subsection of a .gitmodules file) and -1
 * otherwise.
 *
 * The check is purely syntactic: `name` is the candidate string, and the
 * exact set of rejected names is defined by the implementation, not by this
 * header.
 */
int check_submodule_name(const char *name);
|
|
|
|
|
|
|
|
/*
 * Note: these helper functions exist solely to maintain backward
 * compatibility with 'fetch' and 'update_clone' storing configuration in
 * '.gitmodules'.
 *
 * New helpers to retrieve arbitrary configuration from the '.gitmodules' file
 * should NOT be added.
 *
 * Results are handed back through the int pointers.
 * NOTE(review): whether an output is left untouched when the corresponding
 * setting is absent is not visible in this header -- confirm against the
 * definitions.
 */
void fetch_config_from_gitmodules(int *max_children, int *recurse_submodules);
void update_clone_config_from_gitmodules(int *max_jobs);
|
|
|
|
|
|
|
|
#endif /* SUBMODULE_CONFIG_CACHE_H */
|