Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

Update BnfImporter to also import basic paragraphs. #1874

Merged
merged 1 commit into from
Jan 2, 2025
Merged
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
243 changes: 228 additions & 15 deletions web/modules/custom/bnf/src/Services/BnfImporter.php
Original file line number Diff line number Diff line change
Expand Up @@ -4,12 +4,18 @@

use Drupal\bnf\BnfStateEnum;
use Drupal\bnf\Exception\AlreadyExistsException;
use Drupal\Core\Entity\EntityFieldManagerInterface;
use Drupal\Core\Entity\EntityTypeManagerInterface;
use Drupal\Core\StringTranslation\TranslationInterface;
use Drupal\field\Entity\FieldConfig;
use Drupal\field\Entity\FieldStorageConfig;
use Drupal\node\NodeInterface;
use Drupal\paragraphs\ParagraphInterface;
use GuzzleHttp\ClientInterface;
use Psr\Log\LoggerInterface;
use function Safe\json_decode;
use function Safe\parse_url;
use function Safe\preg_replace;

/**
* Service related to importing content from an external source.
Expand All @@ -20,46 +26,235 @@
*/
class BnfImporter {

const ALLOWED_PARAGRAPHS = [
'ParagraphTextBody' => 'text_body',
'ParagraphAccordion' => 'accordion',
];

/**
* Constructor.
*/
public function __construct(
protected ClientInterface $httpClient,
protected EntityFieldManagerInterface $entityFieldManager,
protected EntityTypeManagerInterface $entityTypeManager,
protected TranslationInterface $translation,
protected LoggerInterface $logger,
) {}

/**
* Importing a node from a GraphQL source endpoint.
* Loading the columns of a field, that we use to ask GraphQL for data.
*
* E.g. a WYSIWYG field will have both a "value" and a "format" that we want
* to pull out.
*
* @return mixed[]
* Return an array of fields, along with their column keys.
*/
public function importNode(string $uuid, string $endpointUrl, string $nodeType = 'article'): void {
$nodeStorage = $this->entityTypeManager->getStorage('node');
protected function getFieldColumns(string $entityType, string $bundle): array {
$values = [];
$fields = [];
$fieldDefinitions = $this->entityFieldManager->getFieldDefinitions($entityType, $bundle);

$existingNodes =
$nodeStorage->loadByProperties(['uuid' => $uuid]);
foreach ($fieldDefinitions as $fieldKey => $fieldDefinition) {
if ($fieldDefinition instanceof FieldConfig) {
$fields[] = $fieldKey;
}
}

if (!empty($existingNodes)) {
$this->logger->error(
'Cannot import @type @uuid from @url - Node already exists.',
['@type' => $nodeType, '@uuid' => $uuid, '@url' => $endpointUrl]
);
foreach ($fields as $fieldKey) {
$field = $this->entityTypeManager->getStorage('field_storage_config')->load("$entityType.$fieldKey");

throw new AlreadyExistsException('Cannot import node - already exists.');
if ($field instanceof FieldStorageConfig) {
$values[$fieldKey] = array_keys($field->getColumns());
}
}

// Example of GraphQL query: "nodeArticle".
$queryName = 'node' . ucfirst($nodeType);
return $values;
}

// For now, we only support the title of the nodes.
/**
* Builds the query used to get data from the source.
*/
public function getQuery(string $uuid, string $queryName): string {
// Start building the GraphQL query.
$query = <<<GRAPHQL
query {
$queryName(id: "$uuid") {
title
paragraphs {

GRAPHQL;

// Loop through allowed paragraphs and add their structures.
foreach (self::ALLOWED_PARAGRAPHS as $graphBundle => $drupalBundle) {
Copy link
Contributor

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

I'd suggest to fold this out in a helper method that deals with the "inside" of the paragraphs section.

I think at the end we'll end up with a getQuery that just calls getFields which recursively generates the needed GraphQL.

$query .= <<<GRAPHQL
... on $graphBundle {
__typename

GRAPHQL;

// Add field columns for the current paragraph type.
$fieldColumns = $this->getFieldColumns('paragraph', $drupalBundle);
foreach ($fieldColumns as $fieldKey => $columns) {
$fieldKey = $this->drupalFieldToGraphField($fieldKey);

$columnsString = implode("\r\n ", $columns);
$query .= <<<GRAPHQL
$fieldKey {
$columnsString
}

GRAPHQL;
}

// Close the paragraph type block.
$query .= <<<GRAPHQL
}

GRAPHQL;
}

// Close the paragraphs and main query block.
$query .= <<<GRAPHQL
}
}
}
GRAPHQL;

return $query;
}

/**
* Turn GraphQL field format (camelCase) to Drupal format (snake_case).
*/
protected function graphFieldToDrupalField(string $fieldKey): string {
// Prefix all capitalized letters with an underscore.
$fieldKey = preg_replace('/(?<!^)[A-Z]/', '_$0', $fieldKey);

// Lowercase everything.
$fieldKey = strtolower($fieldKey);

// Prefix with "field_".
return "field_$fieldKey";
}

/**
* Turn Drupal format (snake_case) to GraphQL field format (camelCase).
*/
protected function drupalFieldToGraphField(string $fieldKey): string {
// Remove 'field_' prefix, if it exists.
if (str_starts_with($fieldKey, 'field_')) {
$fieldKey = substr($fieldKey, strlen('field_'));
}

// Replace underscores with spaces.
$fieldKey = str_replace('_', ' ', $fieldKey);

// Convert the first character of each word to uppercase.
$fieldKey = ucwords($fieldKey);

// Remove all spaces.
$fieldKey = str_replace(' ', '', $fieldKey);

// Make first letter lowercase, to match camelCase.
return lcfirst($fieldKey);
}

/**
* Parses paragraphs from GraphQL node data into Drupal-compatible structures.
*
* @param mixed[] $nodeData
* The GraphQL node data containing paragraphs.
*
* @return mixed[]
* Array of paragraph values, that we can use to create paragraph entities.
*/
protected function parseGraphParagraphs(array $nodeData) {
$parsedParagraphs = [];

// Ensure paragraphs exist in the GraphQL response.
if (empty($nodeData['paragraphs'])) {
return $parsedParagraphs;
}

foreach ($nodeData['paragraphs'] as $paragraphData) {
$type = $paragraphData['__typename'] ?? '';

// Convert typename to Drupal paragraph bundle name.
$bundleName = self::ALLOWED_PARAGRAPHS[$type] ?? NULL;

if (empty($bundleName)) {
continue;
}

$paragraph = ['type' => $bundleName];

// Map fields dynamically.
foreach ($paragraphData as $key => $value) {
if ($key === '__typename') {
continue;
}

// Assume Drupal uses field names like "field_{key}".
$drupalFieldName = $this->graphFieldToDrupalField($key);
$paragraph[$drupalFieldName] = $value;
}

$parsedParagraphs[] = $paragraph;
}

return $parsedParagraphs;
}

/**
* Creating the paragraphs, that we will add to the nodes.
*
* @param mixed[] $nodeData
* The GraphQL node data containing paragraphs.
*
* @return \Drupal\paragraphs\ParagraphInterface[]
* The paragraph entities.
*/
protected function getParagraphs(array $nodeData): array {
$parsedParagraphs = $this->parseGraphParagraphs($nodeData);
$storage = $this->entityTypeManager->getStorage('paragraph');
$paragraphs = [];
foreach ($parsedParagraphs as $paragraphData) {
$paragraph = $storage->create($paragraphData);

if ($paragraph instanceof ParagraphInterface) {
$paragraph->save();
$paragraphs[] = $paragraph;
}
}

return $paragraphs;
}

/**
* Loading the node data from a GraphQL endpoint.
*
* @return mixed[]
* Array of node values, that we can use to create node entities.
*/
public function loadNodeData(string $uuid, string $endpointUrl, string $nodeType = 'article'): array {
$queryName = 'node' . ucfirst($nodeType);

$nodeStorage = $this->entityTypeManager->getStorage('node');

$existingNodes =
$nodeStorage->loadByProperties(['uuid' => $uuid]);

if (!empty($existingNodes)) {
$this->logger->error(
'Cannot import @type @uuid from @url - Node already exists.',
['@type' => $nodeType, '@uuid' => $uuid, '@url' => $endpointUrl]
);

throw new AlreadyExistsException('Cannot import node - already exists.');
}

if (!filter_var($endpointUrl, FILTER_VALIDATE_URL)) {
throw new \InvalidArgumentException('The provided callback URL is not valid.');
}
Expand All @@ -71,6 +266,8 @@ public function importNode(string $uuid, string $endpointUrl, string $nodeType =
throw new \InvalidArgumentException('The provided callback URL must use HTTPS.');
}

$query = $this->getQuery($uuid, $queryName);

$response = $this->httpClient->request('post', $endpointUrl, [
'headers' => [
'Content-Type' => 'application/json',
Expand All @@ -87,15 +284,30 @@ public function importNode(string $uuid, string $endpointUrl, string $nodeType =
$nodeData = $data['data'][$queryName] ?? NULL;

if (empty($nodeData)) {
$this->logger->error('Could not find any node data in GraphQL response.');
$this->logger->error(
'Could not find any node data in GraphQL response. @query',
['@query' => $query]
);

throw new \Exception('Could not retrieve content values.');
}
return $nodeData;

}

/**
* Importing a node from a GraphQL source endpoint.
*/
public function importNode(string $uuid, string $endpointUrl, string $nodeType = 'article'): NodeInterface {
$nodeStorage = $this->entityTypeManager->getStorage('node');
try {
$nodeData = $this->loadNodeData($uuid, $endpointUrl, $nodeType);
$nodeData['type'] = $nodeType;
$nodeData['uuid'] = $uuid;
$nodeData['field_paragraphs'] = $this->getParagraphs($nodeData);
$nodeData['status'] = NodeInterface::NOT_PUBLISHED;

/** @var \Drupal\node\NodeInterface $node */
$node = $nodeStorage->create($nodeData);
$node->save();

Expand All @@ -116,6 +328,7 @@ public function importNode(string $uuid, string $endpointUrl, string $nodeType =
'@type' => $nodeType,
]);

return $node;
}

}
Loading