[YouTube] Add parser for attributedDescription
Also update the mock of the next InnerTube endpoint response of the YoutubeStreamExtractorDefaultTest.DescriptionTestUnboxing test class with an attributedDescription instead of a regular description
This commit is contained in:
		
							parent
							
								
									4cae66f1f9
								
							
						
					
					
						commit
						099b53cc4f
					
				
					 3 changed files with 92 additions and 1 deletions
				
			
		|  | @ -1009,6 +1009,90 @@ public final class YoutubeParsingHelper { | ||||||
|         return text; |         return text; | ||||||
|     } |     } | ||||||
| 
 | 
 | ||||||
|  |     /** | ||||||
|  |      * Parse a video description in the new "attributed" format, which contains the entire visible | ||||||
|  |      * plaintext ({@code content}) and an array of {@code commandRuns}. | ||||||
|  |      * | ||||||
|  |      * <p> | ||||||
|  |      * The {@code commandRuns} include the links and their position in the text. | ||||||
|  |      * </p> | ||||||
|  |      * | ||||||
|  |      * @param attributedDescription the JSON object of the attributed description | ||||||
|  |      * @return the parsed description, in HTML format, as a string | ||||||
|  |      */ | ||||||
|  |     @Nullable | ||||||
|  |     public static String getAttributedDescription( | ||||||
|  |             @Nullable final JsonObject attributedDescription) { | ||||||
|  |         if (isNullOrEmpty(attributedDescription)) { | ||||||
|  |             return null; | ||||||
|  |         } | ||||||
|  | 
 | ||||||
|  |         final String content = attributedDescription.getString("content"); | ||||||
|  |         final JsonArray commandRuns = attributedDescription.getArray("commandRuns"); | ||||||
|  |         if (content == null || commandRuns.isEmpty()) { | ||||||
|  |             return null; | ||||||
|  |         } | ||||||
|  | 
 | ||||||
|  |         final StringBuilder textBuilder = new StringBuilder(); | ||||||
|  |         int textStart = 0; | ||||||
|  | 
 | ||||||
|  |         for (final Object commandRun: commandRuns) { | ||||||
|  |             if (!(commandRun instanceof JsonObject)) { | ||||||
|  |                 continue; | ||||||
|  |             } | ||||||
|  | 
 | ||||||
|  |             final JsonObject run = ((JsonObject) commandRun); | ||||||
|  |             final int startIndex = run.getInt("startIndex", -1); | ||||||
|  |             final int length = run.getInt("length"); | ||||||
|  |             final JsonObject navigationEndpoint = run.getObject("onTap") | ||||||
|  |                     .getObject("innertubeCommand"); | ||||||
|  | 
 | ||||||
|  |             if (startIndex < 0 || length < 1 || navigationEndpoint == null) { | ||||||
|  |                 continue; | ||||||
|  |             } | ||||||
|  | 
 | ||||||
|  |             final String url; | ||||||
|  |             try { | ||||||
|  |                 url = getUrlFromNavigationEndpoint(navigationEndpoint); | ||||||
|  |             } catch (final ParsingException e) { | ||||||
|  |                 continue; | ||||||
|  |             } | ||||||
|  | 
 | ||||||
|  |             if (url == null) { | ||||||
|  |                 continue; | ||||||
|  |             } | ||||||
|  | 
 | ||||||
|  |             // Append text before the link | ||||||
|  |             if (startIndex > textStart) { | ||||||
|  |                 textBuilder.append(content, textStart, startIndex); | ||||||
|  |             } | ||||||
|  | 
 | ||||||
|  |             // Trim and append link text | ||||||
|  |             // Channel/Video format: 3xu00a0, (/ •), u00a0, <Name>, 2xu00a0 | ||||||
|  |             final String linkText = content.substring(startIndex, startIndex + length) | ||||||
|  |                     .replace('\u00a0', ' ') | ||||||
|  |                     .trim() | ||||||
|  |                     .replaceFirst("^[/•] *", ""); | ||||||
|  | 
 | ||||||
|  |             textBuilder.append("<a href=\"") | ||||||
|  |                     .append(url) | ||||||
|  |                     .append("\">") | ||||||
|  |                     .append(linkText) | ||||||
|  |                     .append("</a>"); | ||||||
|  | 
 | ||||||
|  |             textStart = startIndex + length; | ||||||
|  |         } | ||||||
|  | 
 | ||||||
|  |         // Append the remaining text | ||||||
|  |         if (textStart < content.length()) { | ||||||
|  |             textBuilder.append(content.substring(textStart)); | ||||||
|  |         } | ||||||
|  | 
 | ||||||
|  |         return textBuilder.toString() | ||||||
|  |                 .replaceAll("\\n", "<br>") | ||||||
|  |                 .replaceAll(" {2}", "  "); | ||||||
|  |     } | ||||||
|  | 
 | ||||||
|     @Nullable |     @Nullable | ||||||
|     public static String getTextFromObject(final JsonObject textObject) throws ParsingException { |     public static String getTextFromObject(final JsonObject textObject) throws ParsingException { | ||||||
|         return getTextFromObject(textObject, false); |         return getTextFromObject(textObject, false); | ||||||
|  |  | ||||||
|  | @ -34,6 +34,7 @@ import static org.schabi.newpipe.extractor.services.youtube.YoutubeParsingHelper | ||||||
| import static org.schabi.newpipe.extractor.services.youtube.YoutubeParsingHelper.getJsonIosPostResponse; | import static org.schabi.newpipe.extractor.services.youtube.YoutubeParsingHelper.getJsonIosPostResponse; | ||||||
| import static org.schabi.newpipe.extractor.services.youtube.YoutubeParsingHelper.getJsonPostResponse; | import static org.schabi.newpipe.extractor.services.youtube.YoutubeParsingHelper.getJsonPostResponse; | ||||||
| import static org.schabi.newpipe.extractor.services.youtube.YoutubeParsingHelper.getTextFromObject; | import static org.schabi.newpipe.extractor.services.youtube.YoutubeParsingHelper.getTextFromObject; | ||||||
|  | import static org.schabi.newpipe.extractor.services.youtube.YoutubeParsingHelper.getAttributedDescription; | ||||||
| import static org.schabi.newpipe.extractor.services.youtube.YoutubeParsingHelper.prepareAndroidMobileJsonBuilder; | import static org.schabi.newpipe.extractor.services.youtube.YoutubeParsingHelper.prepareAndroidMobileJsonBuilder; | ||||||
| import static org.schabi.newpipe.extractor.services.youtube.YoutubeParsingHelper.prepareDesktopJsonBuilder; | import static org.schabi.newpipe.extractor.services.youtube.YoutubeParsingHelper.prepareDesktopJsonBuilder; | ||||||
| import static org.schabi.newpipe.extractor.services.youtube.YoutubeParsingHelper.prepareIosMobileJsonBuilder; | import static org.schabi.newpipe.extractor.services.youtube.YoutubeParsingHelper.prepareIosMobileJsonBuilder; | ||||||
|  | @ -288,6 +289,12 @@ public class YoutubeStreamExtractor extends StreamExtractor { | ||||||
|             if (!isNullOrEmpty(description)) { |             if (!isNullOrEmpty(description)) { | ||||||
|                 return new Description(description, Description.HTML); |                 return new Description(description, Description.HTML); | ||||||
|             } |             } | ||||||
|  | 
 | ||||||
|  |             final String attributedDescription = getAttributedDescription( | ||||||
|  |                     getVideoSecondaryInfoRenderer().getObject("attributedDescription")); | ||||||
|  |             if (!isNullOrEmpty(attributedDescription)) { | ||||||
|  |                 return new Description(attributedDescription, Description.HTML); | ||||||
|  |             } | ||||||
|         } catch (final ParsingException ignored) { |         } catch (final ParsingException ignored) { | ||||||
|             // Age-restricted videos cause a ParsingException here |             // Age-restricted videos cause a ParsingException here | ||||||
|         } |         } | ||||||
|  |  | ||||||
										
											
												File diff suppressed because one or more lines are too long
											
										
									
								
							
		Loading…
	
	Add table
		Add a link
		
	
		Reference in a new issue