kwin commented on a change in pull request #74:
URL: 
https://github.com/apache/sling-org-apache-sling-feature-cpconverter/pull/74#discussion_r615275995



##########
File path: 
src/main/java/org/apache/sling/feature/cpconverter/handlers/BundleEntryHandler.java
##########
@@ -108,111 +141,293 @@ public void handle(@NotNull String path, @NotNull 
Archive archive, @NotNull Entr
             logger.debug("Start level {} was extracted from path {}", 
startLevel, path);
         }
 
-        try (JarInputStream jarInput = new 
JarInputStream(Objects.requireNonNull(archive.openInputStream(entry)))) {
-            Properties properties = readGav(entry.getName(), jarInput);
-            manifest = jarInput.getManifest();
-
-            if (!properties.isEmpty()) {
-                groupId = getCheckedProperty(properties, NAME_GROUP_ID);
-                artifactId = getCheckedProperty(properties, NAME_ARTIFACT_ID);
-                version = getCheckedProperty(properties, NAME_VERSION);
-                classifier = properties.getProperty(NAME_CLASSIFIER);
-            } else { // maybe the included jar is just an OSGi bundle but not 
a valid Maven artifact
-                groupId = getCheckedProperty(manifest, BUNDLE_SYMBOLIC_NAME);
-                // Make sure there are not spaces in the name to adhere to the 
Maven Group Id specification
-                groupId = groupId.replace(' ', '_').replace(':', 
'_').replace('/', '_').replace('\\', '_');
-                if (groupId.indexOf('.') != -1) {
-                    artifactId = groupId.substring(groupId.lastIndexOf('.') + 
1);
-                    groupId = groupId.substring(0, groupId.lastIndexOf('.'));
-                }
-                if (artifactId == null || artifactId.isEmpty()) {
-                    artifactId = groupId;
+        String bundleName = entry.getName();
+        // Remove the leading path
+        int idx = bundleName.lastIndexOf('/');
+        if (idx >= 0) {
+            bundleName = bundleName.substring(idx + 1);
+        }
+        // Remove the extension
+        int edx = bundleName.lastIndexOf('.');
+        if (edx > 0) {
+            bundleName = bundleName.substring(0, edx);
+        }
+        
+        // create a temporary JAR file (extracted from archive)
+        Path tmpBundleJar = 
Files.createTempFile(converter.getTempDirectory().toPath(), "extracted", 
bundleName + ".jar");
+        try (OutputStream output = Files.newOutputStream(tmpBundleJar);
+             InputStream input = 
Objects.requireNonNull(archive.openInputStream(entry))) {
+            IOUtils.copy(input, output);
+        }
+        
+        try (JarFile jarFile = new JarFile(tmpBundleJar.toFile())) {
+            // first extract bundle metadata from JAR input stream
+            ArtifactId id = extractArtifactId(bundleName, jarFile);
+
+            try (InputStream strippedBundleInput = extractInitialContent(id, 
jarFile, converter, runMode)) {
+                
Objects.requireNonNull(converter.getArtifactsDeployer()).deploy(new 
InputStreamArtifactWriter(strippedBundleInput), id);
+                
Objects.requireNonNull(converter.getFeaturesManager()).addArtifact(runMode, id, 
startLevel);
+
+                String exportHeader = 
Objects.requireNonNull(jarFile.getManifest()).getMainAttributes().getValue(Constants.EXPORT_PACKAGE);
+                if (exportHeader != null) {
+                    for (Clause clause : Parser.parseHeader(exportHeader)) {
+                        
converter.getFeaturesManager().addAPIRegionExport(runMode, clause.getName());
+                    }
                 }
-                Version osgiVersion = 
Version.parseVersion(getCheckedProperty(manifest, BUNDLE_VERSION));
-                version = osgiVersion.getMajor() + "." + 
osgiVersion.getMinor() + "." + osgiVersion.getMicro() + 
(osgiVersion.getQualifier().isEmpty() ? "" : "-" + osgiVersion.getQualifier());
             }
+        } finally {
+            Files.delete(tmpBundleJar);
         }
+    }
 
-        try (InputStream input = archive.openInputStream(entry)) {
-            if (input != null) {
-                ArtifactId id = new ArtifactId(groupId, artifactId, version, 
classifier, JAR_TYPE);
+    @NotNull InputStream extractInitialContent(@NotNull ArtifactId 
bundleArtifactId, @NotNull JarFile jarFile, @NotNull 
ContentPackage2FeatureModelConverter converter, @Nullable String runMode) 
throws Exception {
+        // parse "Sling-Initial-Content" header
+        Manifest manifest = Objects.requireNonNull(jarFile.getManifest());
+        Iterator<PathEntry> pathEntries = PathEntry.getContentPaths(manifest, 
-1);
+        if (pathEntries == null) {
+            return new FileInputStream(jarFile.getName());
+        }
+        logger.info("Extracting Sling-Initial-Content from '{}'", 
bundleArtifactId);
+        Collection<PathEntry> pathEntryList = new ArrayList<>();
+        pathEntries.forEachRemaining(pathEntryList::add);
+
+        // remove header
+        manifest.getMainAttributes().remove(new 
Attributes.Name(PathEntry.CONTENT_HEADER));
+        Path newBundleFile = 
Files.createTempFile(converter.getTempDirectory().toPath(), "newBundle", 
".jar");
+        
+        // create JAR file to prevent extracting it twice and for random access
+        JcrNamespaceRegistry namespaceRegistry = 
createNamespaceRegistry(manifest, jarFile);
+        
+        Map<PackageType, VaultPackageAssembler> packageAssemblers = new 
EnumMap<>(PackageType.class);
+        try (OutputStream fileOutput = Files.newOutputStream(newBundleFile, 
StandardOpenOption.WRITE, StandardOpenOption.TRUNCATE_EXISTING);
+            JarOutputStream bundleOutput = new JarOutputStream(fileOutput, 
manifest)) {
+            
+            for (Enumeration<JarEntry> e = jarFile.entries(); 
e.hasMoreElements();) {
+                JarEntry jarEntry = e.nextElement();
+                if (!jarEntry.isDirectory()) {
+                    try (InputStream input = jarFile.getInputStream(jarEntry)) 
{
+                        if (!extractInitialContent(jarEntry, input, 
bundleArtifactId, pathEntryList, packageAssemblers, namespaceRegistry, 
converter)) {
+                            // skip manifest, as already written in the 
constructor (as first entry)
+                            if 
(jarEntry.getName().equals(JarFile.MANIFEST_NAME)) {
+                                continue;
+                            }
+                            // copy entry as is to the stripped bundle
+                            ZipEntry ze = new ZipEntry(jarEntry.getName());
+                            bundleOutput.putNextEntry(ze);
+                            IOUtils.copy(input, bundleOutput);
+                            bundleOutput.closeEntry();
+                        }
+                    }
+                }
+            }
+        }
+        // add additional content packages to feature model
+        finalizePackageAssembly(packageAssemblers, converter, runMode);
+        
+        // return stripped bundle's inputstream which must be deleted on close
+        return Files.newInputStream(newBundleFile, StandardOpenOption.READ, 
StandardOpenOption.DELETE_ON_CLOSE);
+    }
 
-                
Objects.requireNonNull(converter.getArtifactsDeployer()).deploy(new 
InputStreamArtifactWriter(input), id);
+    /**
+     * 
+     * @param jarEntry
+     * @param bundleFileInputStream
+     * @param pathEntriesStream
+     * @param packageAssemblers
+     * @param converter
+     * @return {@code true} in case the given entry was part of the initial 
content otherwise {@code false}
+     * @throws Exception 
+     */
+    boolean extractInitialContent(@NotNull JarEntry jarEntry, @NotNull 
InputStream bundleFileInputStream, @NotNull ArtifactId bundleArtifactId, 
@NotNull Collection<PathEntry> pathEntries, @NotNull Map<PackageType, 
VaultPackageAssembler> packageAssemblers, @NotNull JcrNamespaceRegistry 
nsRegistry, @NotNull ContentPackage2FeatureModelConverter converter) throws 
Exception {
+        final String entryName = jarEntry.getName();
+        // check if current JAR entry is initial content
+        Optional<PathEntry> pathEntry = pathEntries.stream().filter(p -> 
entryName.startsWith(p.getPath())).findFirst();
+        if (!pathEntry.isPresent()) {
+            return false;
+        }
+        ContentParser contentParser = getContentParserForEntry(jarEntry, 
pathEntry.get());
+
+        // 
https://sling.apache.org/documentation/bundles/content-loading-jcr-contentloader.html#file-name-escaping
+        String repositoryPath = (pathEntry.get().getTarget() != null ? 
pathEntry.get().getTarget() : "/") + 
URLDecoder.decode(entryName.substring(pathEntry.get().getPath().length()), 
"UTF-8");
+        String contentPackagePath = 
org.apache.jackrabbit.vault.util.Constants.ROOT_DIR + 
PlatformNameFormat.getPlatformPath(repositoryPath);
+
+        // in which content package should this end up?
+        VaultPackageAssembler packageAssembler = 
initPackageAssemblerForPath(bundleArtifactId, repositoryPath, 
packageAssemblers, converter);
+        Path tmpInputFile = null;
+        if (contentParser != null) {
+            // convert to docview xml
+            tmpInputFile = 
Files.createTempFile(converter.getTempDirectory().toPath(), "docview", ".xml");
+            try (OutputStream docViewOutput = 
Files.newOutputStream(tmpInputFile, StandardOpenOption.WRITE, 
StandardOpenOption.TRUNCATE_EXISTING);
+                 DocViewSerializerContentHandler contentHandler = new 
DocViewSerializerContentHandler(docViewOutput, nsRegistry)) {
+                contentParser.parse(contentHandler, bundleFileInputStream, new 
ParserOptions());
+                contentPackagePath = 
FilenameUtils.removeExtension(contentPackagePath) + ".xml";
+            } catch (IOException e) {
+                throw new IOException("Can not parse " + jarEntry, e);
+            } catch (DocViewSerializerContentHandlerException e) {
+                throw new IOException("Can not convert " + jarEntry + " to 
enhanced DocView format", e);
+            }
+        }
 
-                
Objects.requireNonNull(converter.getFeaturesManager()).addArtifact(runMode, id, 
startLevel);
+        // does entry in initial content need to be extracted into feature 
model (e.g. for OSGi configurations)
+        EntryHandler entryHandler = 
converter.getHandlersManager().getEntryHandlerByEntryPath(contentPackagePath);
+        if (entryHandler != null) {
+            if (tmpInputFile == null) {
+                tmpInputFile = 
Files.createTempFile(converter.getTempDirectory().toPath(), "initial-content", 
Text.getName(jarEntry.getName()));
+                try (OutputStream tmpBundleOutput = 
Files.newOutputStream(tmpInputFile, StandardOpenOption.WRITE, 
StandardOpenOption.TRUNCATE_EXISTING)) {
+                    IOUtils.copy(bundleFileInputStream, tmpBundleOutput);
+                }
+            }
+            // TODO: map path to imitate content-package structure
+            SingleFileArchive archive = new 
SingleFileArchive(tmpInputFile.toFile(), contentPackagePath);
+            entryHandler.handle(repositoryPath, archive, archive.getRoot(), 
converter);
+            Files.delete(tmpInputFile);
+        } else {
+            // ... otherwise add it to the content package
+            if (tmpInputFile != null) {
+                packageAssembler.addEntry(contentPackagePath, 
tmpInputFile.toFile());
+                Files.delete(tmpInputFile);
+            } else {
+                packageAssembler.addEntry(contentPackagePath, 
bundleFileInputStream);
+            }
+        }
+        return true;
+    }
 
-                String epHeader = 
manifest.getMainAttributes().getValue(Constants.EXPORT_PACKAGE);
-                if (epHeader != null) {
-                    for (Clause clause : Parser.parseHeader(epHeader)) {
-                        
converter.getFeaturesManager().addAPIRegionExport(runMode, clause.getName());
+    JcrNamespaceRegistry createNamespaceRegistry(@NotNull Manifest manifest, 
@NotNull JarFile jarFile) throws RepositoryException, IOException, 
ParseException {
+        JcrNamespaceRegistry registry = new JcrNamespaceRegistry();
+        // configured CND
+        
+        // parse Sling-Namespaces header 
(https://github.com/apache/sling-org-apache-sling-jcr-base/blob/66be360910c265473799635fcac0e23895898913/src/main/java/org/apache/sling/jcr/base/internal/loader/Loader.java#L192)
+        final String namespaceDefinition = 
manifest.getMainAttributes().getValue(NAMESPACES_BUNDLE_HEADER);
+        if (namespaceDefinition != null) {
+            final StringTokenizer st = new 
StringTokenizer(namespaceDefinition, ",");
+
+            while ( st.hasMoreTokens() ) {
+                final String token = st.nextToken().trim();
+                int pos = token.indexOf('=');
+                if ( pos == -1 ) {
+                    logger.warn("createNamespaceRegistry: Bundle {} has an 
invalid namespace manifest header entry: {}",
+                            
manifest.getMainAttributes().getValue(Constants.BUNDLE_SYMBOLICNAME), token);
+                } else {
+                    final String prefix = token.substring(0, pos).trim();
+                    final String namespace = token.substring(pos+1).trim();
+                    registry.registerNamespace(prefix, namespace);
+                }
+            }
+        }
+        
+        // parse Sling-Nodetypes header
+        final String typesHeader = 
manifest.getMainAttributes().getValue(NODETYPES_BUNDLE_HEADER);
+        if (typesHeader != null) {
+            StringTokenizer tokener = new StringTokenizer(typesHeader, ",");

Review comment:
       Good idea, I will change that. I just copied the header-parsing code over from 
https://github.com/apache/sling-org-apache-sling-jcr-base/blob/66be360910c265473799635fcac0e23895898913/src/main/java/org/apache/sling/jcr/base/internal/loader/Loader.java#L192
 and 
https://github.com/apache/sling-org-apache-sling-jcr-base/blob/66be360910c265473799635fcac0e23895898913/src/main/java/org/apache/sling/jcr/base/internal/loader/Loader.java#L242




-- 
This is an automated message from the Apache Git Service.
To respond to the message, please log on to GitHub and use the
URL above to go to the specific comment.

For queries about this service, please contact Infrastructure at:
us...@infra.apache.org


Reply via email to