Translate extension for MediaWiki
 
Loading...
Searching...
No Matches
CsvTranslationImporter.php
1<?php
2declare( strict_types = 1 );
3
4namespace MediaWiki\Extension\Translate\MessageGroupProcessing;
5
6use MediaWiki\CommentStore\CommentStoreComment;
7use MediaWiki\Content\ContentHandler;
10use MediaWiki\Page\WikiPageFactory;
11use MediaWiki\Permissions\Authority;
12use MediaWiki\Revision\SlotRecord;
13use MediaWiki\Status\Status;
14use MediaWiki\Title\Title;
15use SplFileObject;
16
24 private WikiPageFactory $wikiPageFactory;
25
26 public function __construct( WikiPageFactory $wikiPageFactory ) {
27 $this->wikiPageFactory = $wikiPageFactory;
28 }
29
31 public function parseFile( string $csvFilePath ): Status {
32 if ( !file_exists( $csvFilePath ) || !is_file( $csvFilePath ) ) {
33 return Status::newFatal(
34 "CSV file path '$csvFilePath' does not exist, is not readable or is not a file"
35 );
36 }
37
38 $indexedLanguageCodes = [];
39 $currentRowCount = -1;
40 $importData = [];
41 $invalidRows = [
42 'emptyTitleRows' => [],
43 'invalidTitleRows' => [],
44 'groupNotFoundRows' => []
45 ];
46
47 $csvFileContent = new SplFileObject( $csvFilePath, 'r' );
48 while ( !$csvFileContent->eof() ) {
49 // Increment the row count at the beginning since we have a bunch of jump statements
50 // at various placaes
51 ++$currentRowCount;
52
53 $csvRow = $csvFileContent->fgetcsv( ',', '"', "\\" );
54 if ( $this->isCsvRowEmpty( $csvRow ) ) {
55 continue;
56 }
57
58 if ( $currentRowCount === 0 ) {
59 // Validate the header
60 $status = $this->getLanguagesFromHeader( $csvRow );
61 if ( !$status->isGood() ) {
62 return $status;
63 }
65 $indexedLanguageCodes = $status->getValue();
66 continue;
67 }
68
69 $rowData = [ 'translations' => [] ];
70 $messageTitle = isset( $csvRow[0] ) ? trim( $csvRow[0] ) : null;
71 if ( !$messageTitle ) {
72 $invalidRows['emptyTitleRows'][] = $currentRowCount + 1;
73 continue;
74 }
75
76 $handle = $this->getMessageHandleIfValid( $messageTitle );
77 if ( $handle === null ) {
78 $invalidRows['invalidTitleRows'][] = $currentRowCount + 1;
79 continue;
80 }
81
82 // Ensure that the group is present
83 $group = $handle->getGroup();
84 if ( !$group ) {
85 $invalidRows['groupNotFoundRows'][] = $currentRowCount + 1;
86 continue;
87 }
88
89 $sourceLanguage = $group->getSourceLanguage();
90
91 $rowData['messageTitle'] = $messageTitle;
92 foreach ( $indexedLanguageCodes as $languageCode => $index ) {
93 if ( $sourceLanguage === $languageCode ) {
94 continue;
95 }
96
97 $rowData['translations'][$languageCode] = $csvRow[$index] ?? null;
98 }
99 $importData[] = $rowData;
100 }
101
102 $status = new Status();
103 if ( $invalidRows['emptyTitleRows'] ) {
104 $status->fatal(
105 'Empty message titles found on row(s): ' . implode( ',', $invalidRows['emptyTitleRows'] )
106 );
107 }
108
109 if ( $invalidRows['invalidTitleRows'] ) {
110 $status->fatal(
111 'Invalid message title(s) found on row(s): ' . implode( ',', $invalidRows['invalidTitleRows'] )
112 );
113 }
114
115 if ( $invalidRows['groupNotFoundRows'] ) {
116 $status->fatal(
117 'Group not found for message(s) on row(s) ' . implode( ',', $invalidRows['invalidTitleRows'] )
118 );
119 }
120
121 if ( !$status->isGood() ) {
122 return $status;
123 }
124
125 return Status::newGood( $importData );
126 }
127
129 public function importData(
130 array $messagesWithTranslations,
131 Authority $authority,
132 string $comment,
133 ?callable $progressReporter = null
134 ): Status {
135 $commentStoreComment = CommentStoreComment::newUnsavedComment( $comment );
136
137 // Loop over each translation to import
138 $importStatus = new Status();
139 $failedStatuses = [];
140 $currentTranslation = 0;
141 foreach ( $messagesWithTranslations as $messageTranslation ) {
142 $messageTitleText = $messageTranslation['messageTitle'];
143 $messageTitle = Title::newFromText( $messageTitleText );
144 $messageHandle = new MessageHandle( $messageTitle );
145
146 $translationImportStatuses = [];
147
148 // Import each translation for the current message
149 $translations = $messageTranslation['translations'];
150 foreach ( $translations as $languageCode => $translation ) {
151 // Skip empty translations
152 if ( $translation === null || trim( $translation ) === '' ) {
153 continue;
154 }
155
156 $translationTitle = $messageHandle->getTitleForLanguage( $languageCode );
157
158 // Perform the update for the translation page
159 $updater = $this->wikiPageFactory->newFromTitle( $translationTitle )
160 ->newPageUpdater( $authority );
161 $content = ContentHandler::makeContent( $translation, $translationTitle );
162 $updater->setContent( SlotRecord::MAIN, $content );
163 $updater->setFlags( EDIT_FORCE_BOT );
164 $updater->saveRevision( $commentStoreComment );
165
166 $status = $updater->getStatus();
167 $translationImportStatuses[] = $status;
168 if ( !$status->isOK() ) {
169 $failedStatuses[ $translationTitle->getPrefixedText() ] = $status;
170 }
171 }
172
173 ++$currentTranslation;
174 if ( $progressReporter ) {
175 $progressReporter(
176 $messageTitle,
177 $translationImportStatuses,
178 count( $messagesWithTranslations ),
179 $currentTranslation
180 );
181 }
182 }
183
184 if ( $failedStatuses ) {
185 foreach ( $failedStatuses as $failedStatus ) {
186 $importStatus->merge( $failedStatus );
187 }
188
189 $importStatus->setResult( false, $failedStatuses );
190 }
191
192 return $importStatus;
193 }
194
195 private function getLanguagesFromHeader( array $csvHeader ): Status {
196 if ( count( $csvHeader ) < 2 ) {
197 return Status::newFatal(
198 'CSV has < 2 columns. Assuming that there are no languages to import'
199 );
200 }
201
202 $languageCodesInHeader = array_slice( $csvHeader, 2 );
203 if ( $languageCodesInHeader === [] ) {
204 return Status::newFatal( 'No languages found for import' );
205 }
206
207 $invalidLanguageCodes = [];
208 $indexedLanguageCodes = [];
209 // First two columns are message title and definition
210 $originalLanguageIndex = 2;
211 foreach ( $languageCodesInHeader as $languageCode ) {
212 if ( !Utilities::isSupportedLanguageCode( strtolower( $languageCode ) ) ) {
213 $invalidLanguageCodes[] = $languageCode;
214 } else {
215 // Language codes maybe in upper case, convert to lower case for further use.
216 $indexedLanguageCodes[ strtolower( $languageCode ) ] = $originalLanguageIndex;
217 }
218 ++$originalLanguageIndex;
219 }
220
221 if ( $invalidLanguageCodes ) {
222 return Status::newFatal(
223 'Invalid language codes detected in CSV header: ' . implode( ', ', $invalidLanguageCodes )
224 );
225 }
226
227 return Status::newGood( $indexedLanguageCodes );
228 }
229
230 private function getMessageHandleIfValid( string $messageTitle ): ?MessageHandle {
231 $title = Title::newFromText( $messageTitle );
232 if ( $title === null ) {
233 return null;
234 }
235
236 $handle = new MessageHandle( $title );
237 if ( $handle->isValid() ) {
238 return $handle;
239 }
240
241 return null;
242 }
243
244 private function isCsvRowEmpty( array $csvRow ): bool {
245 return count( $csvRow ) === 1 && ( $csvRow[0] === null || trim( $csvRow[0] ) === '' );
246 }
247}
return[ 'Translate:AggregateGroupManager'=> static function(MediaWikiServices $services):AggregateGroupManager { return new AggregateGroupManager($services->getTitleFactory(), $services->get( 'Translate:MessageGroupMetadata'));}, 'Translate:AggregateGroupMessageGroupFactory'=> static function(MediaWikiServices $services):AggregateGroupMessageGroupFactory { return new AggregateGroupMessageGroupFactory($services->get( 'Translate:MessageGroupMetadata'));}, 'Translate:ConfigHelper'=> static function():ConfigHelper { return new ConfigHelper();}, 'Translate:CsvTranslationImporter'=> static function(MediaWikiServices $services):CsvTranslationImporter { return new CsvTranslationImporter( $services->getWikiPageFactory());}, 'Translate:EntitySearch'=> static function(MediaWikiServices $services):EntitySearch { return new EntitySearch($services->getMainWANObjectCache(), $services->getCollationFactory() ->makeCollation( 'uca-default-u-kn'), MessageGroups::singleton(), $services->getNamespaceInfo(), $services->get( 'Translate:MessageIndex'), $services->getTitleParser(), $services->getTitleFormatter());}, 'Translate:ExternalMessageSourceStateComparator'=> static function(MediaWikiServices $services):ExternalMessageSourceStateComparator { return new ExternalMessageSourceStateComparator(new SimpleStringComparator(), $services->getRevisionLookup(), $services->getPageStore());}, 'Translate:ExternalMessageSourceStateImporter'=> static function(MediaWikiServices $services):ExternalMessageSourceStateImporter { return new ExternalMessageSourceStateImporter($services->get( 'Translate:GroupSynchronizationCache'), $services->getJobQueueGroup(), LoggerFactory::getInstance(LogNames::GROUP_SYNCHRONIZATION), $services->get( 'Translate:MessageIndex'), $services->getTitleFactory(), $services->get( 'Translate:MessageGroupSubscription'), new ServiceOptions(ExternalMessageSourceStateImporter::CONSTRUCTOR_OPTIONS, $services->getMainConfig()));}, 'Translate:FileBasedMessageGroupFactory'=> static function(MediaWikiServices $services):FileBasedMessageGroupFactory { return new FileBasedMessageGroupFactory(new MessageGroupConfigurationParser(), $services->getContentLanguageCode() ->toString(), new ServiceOptions(FileBasedMessageGroupFactory::SERVICE_OPTIONS, $services->getMainConfig()),);}, 'Translate:FileFormatFactory'=> static function(MediaWikiServices $services):FileFormatFactory { return new FileFormatFactory( $services->getObjectFactory());}, 'Translate:GroupSynchronizationCache'=> static function(MediaWikiServices $services):GroupSynchronizationCache { return new GroupSynchronizationCache( $services->get( 'Translate:PersistentCache'));}, 'Translate:HookDefinedMessageGroupFactory'=> static function(MediaWikiServices $services):HookDefinedMessageGroupFactory { return new HookDefinedMessageGroupFactory( $services->get( 'Translate:HookRunner'));}, 'Translate:HookRunner'=> static function(MediaWikiServices $services):HookRunner { return new HookRunner( $services->getHookContainer());}, 'Translate:MessageBundleDependencyPurger'=> static function(MediaWikiServices $services):MessageBundleDependencyPurger { return new MessageBundleDependencyPurger( $services->get( 'Translate:TranslatableBundleFactory'));}, 'Translate:MessageBundleMessageGroupFactory'=> static function(MediaWikiServices $services):MessageBundleMessageGroupFactory { return new MessageBundleMessageGroupFactory($services->get( 'Translate:MessageGroupMetadata'), new ServiceOptions(MessageBundleMessageGroupFactory::SERVICE_OPTIONS, $services->getMainConfig()),);}, 'Translate:MessageBundleStore'=> static function(MediaWikiServices $services):MessageBundleStore { return new MessageBundleStore($services->get( 'Translate:RevTagStore'), $services->getJobQueueGroup(), $services->getLanguageNameUtils(), $services->get( 'Translate:MessageIndex'), $services->get( 'Translate:MessageGroupMetadata'));}, 'Translate:MessageBundleTranslationLoader'=> static function(MediaWikiServices $services):MessageBundleTranslationLoader { return new MessageBundleTranslationLoader( $services->getLanguageFallback());}, 'Translate:MessageGroupMetadata'=> static function(MediaWikiServices $services):MessageGroupMetadata { return new MessageGroupMetadata( $services->getConnectionProvider());}, 'Translate:MessageGroupReviewStore'=> static function(MediaWikiServices $services):MessageGroupReviewStore { return new MessageGroupReviewStore($services->getConnectionProvider(), $services->get( 'Translate:HookRunner'));}, 'Translate:MessageGroupStatsTableFactory'=> static function(MediaWikiServices $services):MessageGroupStatsTableFactory { return new MessageGroupStatsTableFactory($services->get( 'Translate:ProgressStatsTableFactory'), $services->getLinkRenderer(), $services->get( 'Translate:MessageGroupReviewStore'), $services->get( 'Translate:MessageGroupMetadata'), $services->getMainConfig() ->get( 'TranslateWorkflowStates') !==false);}, 'Translate:MessageGroupSubscription'=> static function(MediaWikiServices $services):MessageGroupSubscription { return new MessageGroupSubscription($services->get( 'Translate:MessageGroupSubscriptionStore'), $services->getJobQueueGroup(), $services->getUserIdentityLookup(), LoggerFactory::getInstance(LogNames::GROUP_SUBSCRIPTION), new ServiceOptions(MessageGroupSubscription::CONSTRUCTOR_OPTIONS, $services->getMainConfig()));}, 'Translate:MessageGroupSubscriptionHookHandler'=> static function(MediaWikiServices $services):?MessageGroupSubscriptionHookHandler { if(! $services->getExtensionRegistry() ->isLoaded( 'Echo')) { return null;} return new MessageGroupSubscriptionHookHandler($services->get( 'Translate:MessageGroupSubscription'), $services->getUserFactory());}, 'Translate:MessageGroupSubscriptionStore'=> static function(MediaWikiServices $services):MessageGroupSubscriptionStore { return new MessageGroupSubscriptionStore( $services->getConnectionProvider());}, 'Translate:MessageIndex'=> static function(MediaWikiServices $services):MessageIndex { $params=(array) $services->getMainConfig() ->get( 'TranslateMessageIndex');$class=array_shift( $params);$implementationMap=['HashMessageIndex'=> HashMessageIndex::class, 'CDBMessageIndex'=> CDBMessageIndex::class, 'DatabaseMessageIndex'=> DatabaseMessageIndex::class, 'hash'=> HashMessageIndex::class, 'cdb'=> CDBMessageIndex::class, 'database'=> DatabaseMessageIndex::class,];$messageIndexStoreClass=$implementationMap[$class] ?? $implementationMap['database'];return new MessageIndex(new $messageIndexStoreClass, $services->getMainWANObjectCache(), $services->getJobQueueGroup(), $services->get( 'Translate:HookRunner'), LoggerFactory::getInstance(LogNames::MAIN), $services->getMainObjectStash(), $services->getConnectionProvider(), new ServiceOptions(MessageIndex::SERVICE_OPTIONS, $services->getMainConfig()),);}, 'Translate:MessagePrefixStats'=> static function(MediaWikiServices $services):MessagePrefixStats { return new MessagePrefixStats( $services->getTitleParser());}, 'Translate:ParsingPlaceholderFactory'=> static function():ParsingPlaceholderFactory { return new ParsingPlaceholderFactory();}, 'Translate:PersistentCache'=> static function(MediaWikiServices $services):PersistentCache { return new PersistentDatabaseCache($services->getConnectionProvider(), $services->getJsonCodec());}, 'Translate:ProgressStatsTableFactory'=> static function(MediaWikiServices $services):ProgressStatsTableFactory { return new ProgressStatsTableFactory($services->getLinkRenderer(), $services->get( 'Translate:ConfigHelper'), $services->get( 'Translate:MessageGroupMetadata'));}, 'Translate:RevTagStore'=> static function(MediaWikiServices $services):RevTagStore { return new RevTagStore( $services->getConnectionProvider());}, 'Translate:SubpageListBuilder'=> static function(MediaWikiServices $services):SubpageListBuilder { return new SubpageListBuilder($services->get( 'Translate:TranslatableBundleFactory'), $services->getLinkBatchFactory());}, 'Translate:TranslatableBundleDeleter'=> static function(MediaWikiServices $services):TranslatableBundleDeleter { return new TranslatableBundleDeleter($services->getMainObjectStash(), $services->getJobQueueGroup(), $services->get( 'Translate:SubpageListBuilder'), $services->get( 'Translate:TranslatableBundleFactory'));}, 'Translate:TranslatableBundleExporter'=> static function(MediaWikiServices $services):TranslatableBundleExporter { return new TranslatableBundleExporter($services->get( 'Translate:SubpageListBuilder'), $services->getWikiExporterFactory(), $services->getConnectionProvider());}, 'Translate:TranslatableBundleFactory'=> static function(MediaWikiServices $services):TranslatableBundleFactory { return new TranslatableBundleFactory($services->get( 'Translate:TranslatablePageStore'), $services->get( 'Translate:MessageBundleStore'));}, 'Translate:TranslatableBundleImporter'=> static function(MediaWikiServices $services):TranslatableBundleImporter { return new TranslatableBundleImporter($services->getWikiImporterFactory(), $services->get( 'Translate:TranslatablePageParser'), $services->getRevisionLookup(), $services->getNamespaceInfo(), $services->getTitleFactory(), $services->getFormatterFactory());}, 'Translate:TranslatableBundleMover'=> static function(MediaWikiServices $services):TranslatableBundleMover { return new TranslatableBundleMover($services->getMovePageFactory(), $services->getJobQueueGroup(), $services->getLinkBatchFactory(), $services->get( 'Translate:TranslatableBundleFactory'), $services->get( 'Translate:SubpageListBuilder'), $services->getConnectionProvider(), $services->getObjectCacheFactory(), $services->getMainConfig() ->get( 'TranslatePageMoveLimit'));}, 'Translate:TranslatableBundleStatusStore'=> static function(MediaWikiServices $services):TranslatableBundleStatusStore { return new TranslatableBundleStatusStore($services->getConnectionProvider() ->getPrimaryDatabase(), $services->getCollationFactory() ->makeCollation( 'uca-default-u-kn'), $services->getDBLoadBalancer() ->getMaintenanceConnectionRef(DB_PRIMARY));}, 'Translate:TranslatablePageMarker'=> static function(MediaWikiServices $services):TranslatablePageMarker { return new TranslatablePageMarker($services->getConnectionProvider(), $services->getJobQueueGroup(), $services->getLinkRenderer(), MessageGroups::singleton(), $services->get( 'Translate:MessageIndex'), $services->getTitleFormatter(), $services->getTitleParser(), $services->get( 'Translate:TranslatablePageParser'), $services->get( 'Translate:TranslatablePageStore'), $services->get( 'Translate:TranslatablePageStateStore'), $services->get( 'Translate:TranslationUnitStoreFactory'), $services->get( 'Translate:MessageGroupMetadata'), $services->getWikiPageFactory(), $services->get( 'Translate:TranslatablePageView'), $services->get( 'Translate:MessageGroupSubscription'), $services->getFormatterFactory(), $services->get( 'Translate:HookRunner'),);}, 'Translate:TranslatablePageMessageGroupFactory'=> static function(MediaWikiServices $services):TranslatablePageMessageGroupFactory { return new TranslatablePageMessageGroupFactory(new ServiceOptions(TranslatablePageMessageGroupFactory::SERVICE_OPTIONS, $services->getMainConfig()),);}, 'Translate:TranslatablePageParser'=> static function(MediaWikiServices $services):TranslatablePageParser { return new TranslatablePageParser($services->get( 'Translate:ParsingPlaceholderFactory'));}, 'Translate:TranslatablePageStateStore'=> static function(MediaWikiServices $services):TranslatablePageStateStore { return new TranslatablePageStateStore($services->get( 'Translate:PersistentCache'), $services->getPageStore());}, 'Translate:TranslatablePageStore'=> static function(MediaWikiServices $services):TranslatablePageStore { return new TranslatablePageStore($services->get( 'Translate:MessageIndex'), $services->getJobQueueGroup(), $services->get( 'Translate:RevTagStore'), $services->getConnectionProvider(), $services->get( 'Translate:TranslatableBundleStatusStore'), $services->get( 'Translate:TranslatablePageParser'), $services->get( 'Translate:MessageGroupMetadata'));}, 'Translate:TranslatablePageView'=> static function(MediaWikiServices $services):TranslatablePageView { return new TranslatablePageView($services->getConnectionProvider(), $services->get( 'Translate:TranslatablePageStateStore'), new ServiceOptions(TranslatablePageView::SERVICE_OPTIONS, $services->getMainConfig()));}, 'Translate:TranslateSandbox'=> static function(MediaWikiServices $services):TranslateSandbox { return new TranslateSandbox($services->getUserFactory(), $services->getConnectionProvider(), $services->getPermissionManager(), $services->getAuthManager(), $services->getUserGroupManager(), $services->getActorStore(), $services->getUserOptionsManager(), $services->getJobQueueGroup(), $services->get( 'Translate:HookRunner'), new ServiceOptions(TranslateSandbox::CONSTRUCTOR_OPTIONS, $services->getMainConfig()));}, 'Translate:TranslationStashReader'=> static function(MediaWikiServices $services):TranslationStashReader { return new TranslationStashStorage( $services->getConnectionProvider() ->getPrimaryDatabase());}, 'Translate:TranslationStatsDataProvider'=> static function(MediaWikiServices $services):TranslationStatsDataProvider { return new TranslationStatsDataProvider(new ServiceOptions(TranslationStatsDataProvider::CONSTRUCTOR_OPTIONS, $services->getMainConfig()), $services->getObjectFactory(), $services->getConnectionProvider());}, 'Translate:TranslationUnitStoreFactory'=> static function(MediaWikiServices $services):TranslationUnitStoreFactory { return new TranslationUnitStoreFactory( $services->getDBLoadBalancer());}, 'Translate:TranslatorActivity'=> static function(MediaWikiServices $services):TranslatorActivity { $query=new TranslatorActivityQuery($services->getMainConfig(), $services->getDBLoadBalancer());return new TranslatorActivity($services->getMainObjectStash(), $query, $services->getJobQueueGroup());}, 'Translate:TtmServerFactory'=> static function(MediaWikiServices $services):TtmServerFactory { $config=$services->getMainConfig();$default=$config->get( 'TranslateTranslationDefaultService');if( $default===false) { $default=null;} return new TtmServerFactory( $config->get( 'TranslateTranslationServices'), $default);}, 'Translate:WorkflowStatesMessageGroupLoader'=> static function(MediaWikiServices $services):WorkflowStatesMessageGroupLoader { return new WorkflowStatesMessageGroupLoader(new ServiceOptions(WorkflowStatesMessageGroupLoader::CONSTRUCTOR_OPTIONS, $services->getMainConfig()),);},]
@phpcs-require-sorted-array
importData(array $messagesWithTranslations, Authority $authority, string $comment, ?callable $progressReporter=null)
Import the data returned from the parseFile method.
Class for pointing to messages, like Title class is for titles.
Essentially random collection of helper functions, similar to GlobalFunctions.php.
Definition Utilities.php:29