Skip to content

Commit

Permalink
Never export monikers for the JDK except when indexin the JDK
Browse files Browse the repository at this point in the history
Previously, there was a small risk that lsif-java would export symbols
against the JDK when indexing non-JDK packages like
com.google.gwt:gwt-user:2.9.0, which contain source files for
`java.lang.String` but don't define `java/lang/String.class`.

This commit, adds a special case for the JDK so that monikers for JDK
symbols are always imported when indexing non-JDK repos.
  • Loading branch information
olafurpg committed May 19, 2021
1 parent 4c8f2e6 commit 543fb44
Show file tree
Hide file tree
Showing 8 changed files with 44 additions and 18 deletions.
Original file line number Diff line number Diff line change
Expand Up @@ -13,6 +13,7 @@ abstract class BuildTool(val name: String, index: IndexCommand) {
protected def defaultTargetroot: Path

def isHidden: Boolean = false
def buildKind: String = ""

final def sourceroot: Path = index.workingDirectory
final def targetroot: Path =
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -54,6 +54,8 @@ class LsifBuildTool(index: IndexCommand) extends BuildTool("LSIF", index) {
index.workingDirectory.resolve(LsifBuildTool.ConfigFileName)
def usedInCurrentDirectory(): Boolean = Files.isRegularFile(configFile)
override def isHidden: Boolean = true
override def buildKind: String =
parsedConfig.fold(_.kind, _ => super.buildKind)
def generateSemanticdb(): CommandResult = {
parsedConfig match {
case ValueResult(value) =>
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -160,6 +160,7 @@ case class IndexCommand(
output = finalOutput,
targetroot = List(tool.targetroot),
packagehub = packagehub,
buildKind = tool.buildKind,
app = app
).run()
}
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -38,6 +38,9 @@ final case class IndexSemanticdbCommand(
packagehub: Option[String] = None,
@Description("Directories that contain SemanticDB files.")
@PositionalArguments() targetroot: List[Path] = Nil,
@Description(
"The kind of this build, one of: empty string, jdk, maven"
) buildKind: String = "",
@Inline() app: Application = Application.default
) extends Command {
def sourceroot: Path = AbsolutePath.of(app.env.workingDirectory)
Expand Down Expand Up @@ -72,7 +75,8 @@ final case class IndexSemanticdbCommand(
"java",
format,
parallel,
packages.map(_.toPackageInformation).asJava
packages.map(_.toPackageInformation).asJava,
buildKind
)
LsifSemanticdb.run(options)
postPackages(packages)
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -97,7 +97,7 @@ private Integer processDocument(
.collect(Collectors.toSet());
doc.id = documentId;
ResultSets results =
new ResultSets(writer, globals, isExportedSymbol, localDefinitions, packages);
new ResultSets(writer, globals, isExportedSymbol, localDefinitions, packages, options);
Set<Integer> rangeIds = new LinkedHashSet<>();

for (SymbolOccurrence occ : doc.sortedSymbolOccurrences()) {
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -16,6 +16,7 @@ public class LsifSemanticdbOptions {
public final LsifOutputFormat format;
public final boolean parallel;
public final List<MavenPackage> packages;
public final String buildKind;

public LsifSemanticdbOptions(
List<Path> targetroots,
Expand All @@ -26,7 +27,8 @@ public LsifSemanticdbOptions(
String language,
LsifOutputFormat format,
boolean parallel,
List<MavenPackage> packages) {
List<MavenPackage> packages,
String buildKind) {
this.targetroots = targetroots;
this.output = output;
this.sourceroot = sourceroot;
Expand All @@ -36,5 +38,6 @@ public LsifSemanticdbOptions(
this.format = format;
this.parallel = parallel;
this.packages = packages;
this.buildKind = buildKind;
}
}
Original file line number Diff line number Diff line change
Expand Up @@ -46,23 +46,16 @@ public PackageTable(LsifSemanticdbOptions options, LsifWriter writer) throws IOE
}
}

public void writeImportedSymbol(String symbol, int monikerId) {
packageForSymbol(symbol)
.ifPresent(
pkg -> {
int pkgId = lsif.computeIfAbsent(pkg, this);
writer.emitPackageInformationEdge(monikerId, pkgId);
});
public void writeMonikerPackage(int monikerId, Package pkg) {
int pkgId = lsif.computeIfAbsent(pkg, this);
writer.emitPackageInformationEdge(monikerId, pkgId);
}

private Optional<Package> packageForClassfile(String classfile) {
Package result = byClassfile.get(classfile);
if (result != null) return Optional.of(result);
if (!javaVersion.isJava8 && isJrtClassfile(classfile)) return Optional.of(javaVersion.pkg);
return Optional.empty();
public void writeImportedSymbol(String symbol, int monikerId) {
packageForSymbol(symbol).ifPresent(pkg -> writeMonikerPackage(monikerId, pkg));
}

private Optional<Package> packageForSymbol(String symbol) {
public Optional<Package> packageForSymbol(String symbol) {
return SymbolDescriptor.toplevel(symbol)
.flatMap(
toplevel -> {
Expand All @@ -71,6 +64,13 @@ private Optional<Package> packageForSymbol(String symbol) {
});
}

private Optional<Package> packageForClassfile(String classfile) {
Package result = byClassfile.get(classfile);
if (result != null) return Optional.of(result);
if (!javaVersion.isJava8 && isJrtClassfile(classfile)) return Optional.of(javaVersion.pkg);
return Optional.empty();
}

private void indexPackage(MavenPackage pkg) throws IOException {
if (!JAR_PATTERN.matches(pkg.jar)) {
return;
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -3,6 +3,7 @@
import com.sourcegraph.semanticdb_javac.SemanticdbSymbols;
import java.util.HashMap;
import java.util.Map;
import java.util.Optional;
import java.util.Set;
import java.util.function.Function;

Expand All @@ -15,18 +16,21 @@ public class ResultSets implements Function<String, ResultIds> {
private final Set<String> exportedSymbols;
private final Set<String> localDefinitions;
private final PackageTable packages;
private final boolean isJdkRepo;

public ResultSets(
LsifWriter writer,
Map<String, ResultIds> globals,
Set<String> exportedSymbols,
Set<String> localDefinitions,
PackageTable packages) {
PackageTable packages,
LsifSemanticdbOptions options) {
this.writer = writer;
this.globals = globals;
this.exportedSymbols = exportedSymbols;
this.localDefinitions = localDefinitions;
this.packages = packages;
this.isJdkRepo = options.buildKind.equals("jdk");
locals = new HashMap<>();
}

Expand All @@ -43,9 +47,20 @@ public ResultIds apply(String symbol) {
int resultSet = writer.emitResultSet();

// Moniker
Optional<Package> pkg = packages.packageForSymbol(symbol);
if (pkg.isPresent() && pkg.get() instanceof JdkPackage && !isJdkRepo) {
// Never export monikers for the JDK repo unless we're indexing the JDK repo.
// Some Maven packages contain sources that redefine symbols like `java/lang/String#`
// even if the the jar files don't contain `java/lang/String.class`. For example,
// see the package com.google.gwt:gwt-user:2.9.0.
// Related issue: https://github.com/sourcegraph/sourcegraph/issues/21058
isExportedSymbol = false;
}
int monikerId = writer.emitMonikerVertex(symbol, hasDefinitionResult);
writer.emitMonikerEdge(resultSet, monikerId);
packages.writeImportedSymbol(symbol, monikerId);
if (pkg.isPresent()) {
packages.writeMonikerPackage(monikerId, pkg.get());
}

int definitionId = hasDefinitionResult ? writer.emitDefinitionResult(resultSet) : -1;

Expand Down

0 comments on commit 543fb44

Please sign in to comment.