<?xml version="1.0"?>
<feed xmlns="http://www.w3.org/2005/Atom" xml:lang="ru">
	<id>http://digida.mgpu.ru/index.php?action=history&amp;feed=atom&amp;title=%D0%9C%D0%B5%D1%82%D0%BE%D0%B4%D1%8B_%D0%B8%D0%BD%D1%84%D0%BE%D1%80%D0%BC%D0%B0%D1%86%D0%B8%D0%BE%D0%BD%D0%BD%D0%BE%D0%B3%D0%BE_%D0%B0%D0%BD%D0%B0%D0%BB%D0%B8%D0%B7%D0%B0_%D1%82%D0%B5%D0%BA%D1%81%D1%82%D0%B0_%28syllabus%29_2025%2F%D0%A3%D1%80%D0%BE%D0%BA_1</id>
	<title>Методы информационного анализа текста (syllabus) 2025/Урок 1 - История изменений</title>
	<link rel="self" type="application/atom+xml" href="http://digida.mgpu.ru/index.php?action=history&amp;feed=atom&amp;title=%D0%9C%D0%B5%D1%82%D0%BE%D0%B4%D1%8B_%D0%B8%D0%BD%D1%84%D0%BE%D1%80%D0%BC%D0%B0%D1%86%D0%B8%D0%BE%D0%BD%D0%BD%D0%BE%D0%B3%D0%BE_%D0%B0%D0%BD%D0%B0%D0%BB%D0%B8%D0%B7%D0%B0_%D1%82%D0%B5%D0%BA%D1%81%D1%82%D0%B0_%28syllabus%29_2025%2F%D0%A3%D1%80%D0%BE%D0%BA_1"/>
	<link rel="alternate" type="text/html" href="http://digida.mgpu.ru/index.php?title=%D0%9C%D0%B5%D1%82%D0%BE%D0%B4%D1%8B_%D0%B8%D0%BD%D1%84%D0%BE%D1%80%D0%BC%D0%B0%D1%86%D0%B8%D0%BE%D0%BD%D0%BD%D0%BE%D0%B3%D0%BE_%D0%B0%D0%BD%D0%B0%D0%BB%D0%B8%D0%B7%D0%B0_%D1%82%D0%B5%D0%BA%D1%81%D1%82%D0%B0_(syllabus)_2025/%D0%A3%D1%80%D0%BE%D0%BA_1&amp;action=history"/>
	<updated>2026-04-23T10:14:00Z</updated>
	<subtitle>История изменений этой страницы в вики</subtitle>
	<generator>MediaWiki 1.44.0</generator>
	<entry>
		<id>http://digida.mgpu.ru/index.php?title=%D0%9C%D0%B5%D1%82%D0%BE%D0%B4%D1%8B_%D0%B8%D0%BD%D1%84%D0%BE%D1%80%D0%BC%D0%B0%D1%86%D0%B8%D0%BE%D0%BD%D0%BD%D0%BE%D0%B3%D0%BE_%D0%B0%D0%BD%D0%B0%D0%BB%D0%B8%D0%B7%D0%B0_%D1%82%D0%B5%D0%BA%D1%81%D1%82%D0%B0_(syllabus)_2025/%D0%A3%D1%80%D0%BE%D0%BA_1&amp;diff=44399&amp;oldid=prev</id>
		<title>Patarakin в 07:30, 24 февраля 2026</title>
		<link rel="alternate" type="text/html" href="http://digida.mgpu.ru/index.php?title=%D0%9C%D0%B5%D1%82%D0%BE%D0%B4%D1%8B_%D0%B8%D0%BD%D1%84%D0%BE%D1%80%D0%BC%D0%B0%D1%86%D0%B8%D0%BE%D0%BD%D0%BD%D0%BE%D0%B3%D0%BE_%D0%B0%D0%BD%D0%B0%D0%BB%D0%B8%D0%B7%D0%B0_%D1%82%D0%B5%D0%BA%D1%81%D1%82%D0%B0_(syllabus)_2025/%D0%A3%D1%80%D0%BE%D0%BA_1&amp;diff=44399&amp;oldid=prev"/>
		<updated>2026-02-24T07:30:01Z</updated>

		<summary type="html">&lt;p&gt;&lt;/p&gt;
&lt;table style=&quot;background-color: #fff; color: #202122;&quot; data-mw=&quot;interface&quot;&gt;
				&lt;col class=&quot;diff-marker&quot; /&gt;
				&lt;col class=&quot;diff-content&quot; /&gt;
				&lt;col class=&quot;diff-marker&quot; /&gt;
				&lt;col class=&quot;diff-content&quot; /&gt;
				&lt;tr class=&quot;diff-title&quot; lang=&quot;ru&quot;&gt;
				&lt;td colspan=&quot;2&quot; style=&quot;background-color: #fff; color: #202122; text-align: center;&quot;&gt;← Предыдущая версия&lt;/td&gt;
				&lt;td colspan=&quot;2&quot; style=&quot;background-color: #fff; color: #202122; text-align: center;&quot;&gt;Версия от 10:30, 24 февраля 2026&lt;/td&gt;
				&lt;/tr&gt;&lt;tr&gt;&lt;td colspan=&quot;2&quot; class=&quot;diff-lineno&quot; id=&quot;mw-diff-left-l73&quot;&gt;Строка 73:&lt;/td&gt;
&lt;td colspan=&quot;2&quot; class=&quot;diff-lineno&quot;&gt;Строка 73:&lt;/td&gt;&lt;/tr&gt;
&lt;tr&gt;&lt;td class=&quot;diff-marker&quot;&gt;&lt;/td&gt;&lt;td style=&quot;background-color: #f8f9fa; color: #202122; font-size: 88%; border-style: solid; border-width: 1px 1px 1px 4px; border-radius: 0.33em; border-color: #eaecf0; vertical-align: top; white-space: pre-wrap;&quot;&gt;&lt;div&gt;data &amp;lt;- read_csv(&amp;quot;metaph-science-lens.csv&amp;quot;)&lt;/div&gt;&lt;/td&gt;&lt;td class=&quot;diff-marker&quot;&gt;&lt;/td&gt;&lt;td style=&quot;background-color: #f8f9fa; color: #202122; font-size: 88%; border-style: solid; border-width: 1px 1px 1px 4px; border-radius: 0.33em; border-color: #eaecf0; vertical-align: top; white-space: pre-wrap;&quot;&gt;&lt;div&gt;data &amp;lt;- read_csv(&amp;quot;metaph-science-lens.csv&amp;quot;)&lt;/div&gt;&lt;/td&gt;&lt;/tr&gt;
&lt;tr&gt;&lt;td class=&quot;diff-marker&quot;&gt;&lt;/td&gt;&lt;td style=&quot;background-color: #f8f9fa; color: #202122; font-size: 88%; border-style: solid; border-width: 1px 1px 1px 4px; border-radius: 0.33em; border-color: #eaecf0; vertical-align: top; white-space: pre-wrap;&quot;&gt;&lt;br&gt;&lt;/td&gt;&lt;td class=&quot;diff-marker&quot;&gt;&lt;/td&gt;&lt;td style=&quot;background-color: #f8f9fa; color: #202122; font-size: 88%; border-style: solid; border-width: 1px 1px 1px 4px; border-radius: 0.33em; border-color: #eaecf0; vertical-align: top; white-space: pre-wrap;&quot;&gt;&lt;br&gt;&lt;/td&gt;&lt;/tr&gt;
&lt;tr&gt;&lt;td colspan=&quot;2&quot; class=&quot;diff-side-deleted&quot;&gt;&lt;/td&gt;&lt;td class=&quot;diff-marker&quot; data-marker=&quot;+&quot;&gt;&lt;/td&gt;&lt;td style=&quot;color: #202122; font-size: 88%; border-style: solid; border-width: 1px 1px 1px 4px; border-radius: 0.33em; border-color: #a3d3ff; vertical-align: top; white-space: pre-wrap;&quot;&gt;&lt;div&gt;&lt;ins style=&quot;font-weight: bold; text-decoration: none;&quot;&gt;data_AS &amp;lt;- read_csv(&quot;https://raw.githubusercontent.com/patarakin/stat-data/refs/heads/main/datasets/csv/lens-acad-sci-psych.csv&quot;)&lt;/ins&gt;&lt;/div&gt;&lt;/td&gt;&lt;/tr&gt;
&lt;tr&gt;&lt;td class=&quot;diff-marker&quot;&gt;&lt;/td&gt;&lt;td style=&quot;background-color: #f8f9fa; color: #202122; font-size: 88%; border-style: solid; border-width: 1px 1px 1px 4px; border-radius: 0.33em; border-color: #eaecf0; vertical-align: top; white-space: pre-wrap;&quot;&gt;&lt;br&gt;&lt;/td&gt;&lt;td class=&quot;diff-marker&quot;&gt;&lt;/td&gt;&lt;td style=&quot;background-color: #f8f9fa; color: #202122; font-size: 88%; border-style: solid; border-width: 1px 1px 1px 4px; border-radius: 0.33em; border-color: #eaecf0; vertical-align: top; white-space: pre-wrap;&quot;&gt;&lt;br&gt;&lt;/td&gt;&lt;/tr&gt;
&lt;tr&gt;&lt;td class=&quot;diff-marker&quot;&gt;&lt;/td&gt;&lt;td style=&quot;background-color: #f8f9fa; color: #202122; font-size: 88%; border-style: solid; border-width: 1px 1px 1px 4px; border-radius: 0.33em; border-color: #eaecf0; vertical-align: top; white-space: pre-wrap;&quot;&gt;&lt;div&gt;# ====================================================================&lt;/div&gt;&lt;/td&gt;&lt;td class=&quot;diff-marker&quot;&gt;&lt;/td&gt;&lt;td style=&quot;background-color: #f8f9fa; color: #202122; font-size: 88%; border-style: solid; border-width: 1px 1px 1px 4px; border-radius: 0.33em; border-color: #eaecf0; vertical-align: top; white-space: pre-wrap;&quot;&gt;&lt;div&gt;# ====================================================================&lt;/div&gt;&lt;/td&gt;&lt;/tr&gt;
&lt;/table&gt;</summary>
		<author><name>Patarakin</name></author>
	</entry>
	<entry>
		<id>http://digida.mgpu.ru/index.php?title=%D0%9C%D0%B5%D1%82%D0%BE%D0%B4%D1%8B_%D0%B8%D0%BD%D1%84%D0%BE%D1%80%D0%BC%D0%B0%D1%86%D0%B8%D0%BE%D0%BD%D0%BD%D0%BE%D0%B3%D0%BE_%D0%B0%D0%BD%D0%B0%D0%BB%D0%B8%D0%B7%D0%B0_%D1%82%D0%B5%D0%BA%D1%81%D1%82%D0%B0_(syllabus)_2025/%D0%A3%D1%80%D0%BE%D0%BA_1&amp;diff=44398&amp;oldid=prev</id>
		<title>Patarakin в 07:28, 24 февраля 2026</title>
		<link rel="alternate" type="text/html" href="http://digida.mgpu.ru/index.php?title=%D0%9C%D0%B5%D1%82%D0%BE%D0%B4%D1%8B_%D0%B8%D0%BD%D1%84%D0%BE%D1%80%D0%BC%D0%B0%D1%86%D0%B8%D0%BE%D0%BD%D0%BD%D0%BE%D0%B3%D0%BE_%D0%B0%D0%BD%D0%B0%D0%BB%D0%B8%D0%B7%D0%B0_%D1%82%D0%B5%D0%BA%D1%81%D1%82%D0%B0_(syllabus)_2025/%D0%A3%D1%80%D0%BE%D0%BA_1&amp;diff=44398&amp;oldid=prev"/>
		<updated>2026-02-24T07:28:45Z</updated>

		<summary type="html">&lt;p&gt;&lt;/p&gt;
&lt;table style=&quot;background-color: #fff; color: #202122;&quot; data-mw=&quot;interface&quot;&gt;
				&lt;col class=&quot;diff-marker&quot; /&gt;
				&lt;col class=&quot;diff-content&quot; /&gt;
				&lt;col class=&quot;diff-marker&quot; /&gt;
				&lt;col class=&quot;diff-content&quot; /&gt;
				&lt;tr class=&quot;diff-title&quot; lang=&quot;ru&quot;&gt;
				&lt;td colspan=&quot;2&quot; style=&quot;background-color: #fff; color: #202122; text-align: center;&quot;&gt;← Предыдущая версия&lt;/td&gt;
				&lt;td colspan=&quot;2&quot; style=&quot;background-color: #fff; color: #202122; text-align: center;&quot;&gt;Версия от 10:28, 24 февраля 2026&lt;/td&gt;
				&lt;/tr&gt;&lt;tr&gt;&lt;td colspan=&quot;2&quot; class=&quot;diff-lineno&quot; id=&quot;mw-diff-left-l214&quot;&gt;Строка 214:&lt;/td&gt;
&lt;td colspan=&quot;2&quot; class=&quot;diff-lineno&quot;&gt;Строка 214:&lt;/td&gt;&lt;/tr&gt;
&lt;tr&gt;&lt;td class=&quot;diff-marker&quot;&gt;&lt;/td&gt;&lt;td style=&quot;background-color: #f8f9fa; color: #202122; font-size: 88%; border-style: solid; border-width: 1px 1px 1px 4px; border-radius: 0.33em; border-color: #eaecf0; vertical-align: top; white-space: pre-wrap;&quot;&gt;&lt;div&gt;# ====================================================================&lt;/div&gt;&lt;/td&gt;&lt;td class=&quot;diff-marker&quot;&gt;&lt;/td&gt;&lt;td style=&quot;background-color: #f8f9fa; color: #202122; font-size: 88%; border-style: solid; border-width: 1px 1px 1px 4px; border-radius: 0.33em; border-color: #eaecf0; vertical-align: top; white-space: pre-wrap;&quot;&gt;&lt;div&gt;# ====================================================================&lt;/div&gt;&lt;/td&gt;&lt;/tr&gt;
&lt;tr&gt;&lt;td class=&quot;diff-marker&quot;&gt;&lt;/td&gt;&lt;td style=&quot;background-color: #f8f9fa; color: #202122; font-size: 88%; border-style: solid; border-width: 1px 1px 1px 4px; border-radius: 0.33em; border-color: #eaecf0; vertical-align: top; white-space: pre-wrap;&quot;&gt;&lt;div&gt;&amp;lt;/syntaxhighlight&amp;gt;&lt;/div&gt;&lt;/td&gt;&lt;td class=&quot;diff-marker&quot;&gt;&lt;/td&gt;&lt;td style=&quot;background-color: #f8f9fa; color: #202122; font-size: 88%; border-style: solid; border-width: 1px 1px 1px 4px; border-radius: 0.33em; border-color: #eaecf0; vertical-align: top; white-space: pre-wrap;&quot;&gt;&lt;div&gt;&amp;lt;/syntaxhighlight&amp;gt;&lt;/div&gt;&lt;/td&gt;&lt;/tr&gt;
&lt;tr&gt;&lt;td colspan=&quot;2&quot; class=&quot;diff-side-deleted&quot;&gt;&lt;/td&gt;&lt;td class=&quot;diff-marker&quot; data-marker=&quot;+&quot;&gt;&lt;/td&gt;&lt;td style=&quot;color: #202122; font-size: 88%; border-style: solid; border-width: 1px 1px 1px 4px; border-radius: 0.33em; border-color: #a3d3ff; vertical-align: top; white-space: pre-wrap;&quot;&gt;&lt;div&gt;&lt;ins style=&quot;font-weight: bold; text-decoration: none;&quot;&gt;&lt;/ins&gt;&lt;/div&gt;&lt;/td&gt;&lt;/tr&gt;
&lt;tr&gt;&lt;td colspan=&quot;2&quot; class=&quot;diff-side-deleted&quot;&gt;&lt;/td&gt;&lt;td class=&quot;diff-marker&quot; data-marker=&quot;+&quot;&gt;&lt;/td&gt;&lt;td style=&quot;color: #202122; font-size: 88%; border-style: solid; border-width: 1px 1px 1px 4px; border-radius: 0.33em; border-color: #a3d3ff; vertical-align: top; white-space: pre-wrap;&quot;&gt;&lt;div&gt;&lt;ins style=&quot;font-weight: bold; text-decoration: none;&quot;&gt;[[Категория:Lesson]]&lt;/ins&gt;&lt;/div&gt;&lt;/td&gt;&lt;/tr&gt;
&lt;/table&gt;</summary>
		<author><name>Patarakin</name></author>
	</entry>
	<entry>
		<id>http://digida.mgpu.ru/index.php?title=%D0%9C%D0%B5%D1%82%D0%BE%D0%B4%D1%8B_%D0%B8%D0%BD%D1%84%D0%BE%D1%80%D0%BC%D0%B0%D1%86%D0%B8%D0%BE%D0%BD%D0%BD%D0%BE%D0%B3%D0%BE_%D0%B0%D0%BD%D0%B0%D0%BB%D0%B8%D0%B7%D0%B0_%D1%82%D0%B5%D0%BA%D1%81%D1%82%D0%B0_(syllabus)_2025/%D0%A3%D1%80%D0%BE%D0%BA_1&amp;diff=34186&amp;oldid=prev</id>
		<title>Patarakin в 04:29, 8 ноября 2025</title>
		<link rel="alternate" type="text/html" href="http://digida.mgpu.ru/index.php?title=%D0%9C%D0%B5%D1%82%D0%BE%D0%B4%D1%8B_%D0%B8%D0%BD%D1%84%D0%BE%D1%80%D0%BC%D0%B0%D1%86%D0%B8%D0%BE%D0%BD%D0%BD%D0%BE%D0%B3%D0%BE_%D0%B0%D0%BD%D0%B0%D0%BB%D0%B8%D0%B7%D0%B0_%D1%82%D0%B5%D0%BA%D1%81%D1%82%D0%B0_(syllabus)_2025/%D0%A3%D1%80%D0%BE%D0%BA_1&amp;diff=34186&amp;oldid=prev"/>
		<updated>2025-11-08T04:29:29Z</updated>

		<summary type="html">&lt;p&gt;&lt;/p&gt;
&lt;table style=&quot;background-color: #fff; color: #202122;&quot; data-mw=&quot;interface&quot;&gt;
				&lt;col class=&quot;diff-marker&quot; /&gt;
				&lt;col class=&quot;diff-content&quot; /&gt;
				&lt;col class=&quot;diff-marker&quot; /&gt;
				&lt;col class=&quot;diff-content&quot; /&gt;
				&lt;tr class=&quot;diff-title&quot; lang=&quot;ru&quot;&gt;
				&lt;td colspan=&quot;2&quot; style=&quot;background-color: #fff; color: #202122; text-align: center;&quot;&gt;← Предыдущая версия&lt;/td&gt;
				&lt;td colspan=&quot;2&quot; style=&quot;background-color: #fff; color: #202122; text-align: center;&quot;&gt;Версия от 07:29, 8 ноября 2025&lt;/td&gt;
				&lt;/tr&gt;&lt;tr&gt;&lt;td colspan=&quot;2&quot; class=&quot;diff-lineno&quot; id=&quot;mw-diff-left-l18&quot;&gt;Строка 18:&lt;/td&gt;
&lt;td colspan=&quot;2&quot; class=&quot;diff-lineno&quot;&gt;Строка 18:&lt;/td&gt;&lt;/tr&gt;
&lt;tr&gt;&lt;td class=&quot;diff-marker&quot;&gt;&lt;/td&gt;&lt;td style=&quot;background-color: #f8f9fa; color: #202122; font-size: 88%; border-style: solid; border-width: 1px 1px 1px 4px; border-radius: 0.33em; border-color: #eaecf0; vertical-align: top; white-space: pre-wrap;&quot;&gt;&lt;div&gt;# Установить новую рабочую директорию (при необходимости)&lt;/div&gt;&lt;/td&gt;&lt;td class=&quot;diff-marker&quot;&gt;&lt;/td&gt;&lt;td style=&quot;background-color: #f8f9fa; color: #202122; font-size: 88%; border-style: solid; border-width: 1px 1px 1px 4px; border-radius: 0.33em; border-color: #eaecf0; vertical-align: top; white-space: pre-wrap;&quot;&gt;&lt;div&gt;# Установить новую рабочую директорию (при необходимости)&lt;/div&gt;&lt;/td&gt;&lt;/tr&gt;
&lt;tr&gt;&lt;td class=&quot;diff-marker&quot;&gt;&lt;/td&gt;&lt;td style=&quot;background-color: #f8f9fa; color: #202122; font-size: 88%; border-style: solid; border-width: 1px 1px 1px 4px; border-radius: 0.33em; border-color: #eaecf0; vertical-align: top; white-space: pre-wrap;&quot;&gt;&lt;div&gt;# setwd(&amp;quot;путь/к/вашей/папке&amp;quot;)&lt;/div&gt;&lt;/td&gt;&lt;td class=&quot;diff-marker&quot;&gt;&lt;/td&gt;&lt;td style=&quot;background-color: #f8f9fa; color: #202122; font-size: 88%; border-style: solid; border-width: 1px 1px 1px 4px; border-radius: 0.33em; border-color: #eaecf0; vertical-align: top; white-space: pre-wrap;&quot;&gt;&lt;div&gt;# setwd(&amp;quot;путь/к/вашей/папке&amp;quot;)&lt;/div&gt;&lt;/td&gt;&lt;/tr&gt;
&lt;tr&gt;&lt;td class=&quot;diff-marker&quot; data-marker=&quot;−&quot;&gt;&lt;/td&gt;&lt;td style=&quot;color: #202122; font-size: 88%; border-style: solid; border-width: 1px 1px 1px 4px; border-radius: 0.33em; border-color: #ffe49c; vertical-align: top; white-space: pre-wrap;&quot;&gt;&lt;div&gt;setwd(&quot;C:/Users/Evgeny/Documents/R_Text&quot;)&lt;/div&gt;&lt;/td&gt;&lt;td class=&quot;diff-marker&quot; data-marker=&quot;+&quot;&gt;&lt;/td&gt;&lt;td style=&quot;color: #202122; font-size: 88%; border-style: solid; border-width: 1px 1px 1px 4px; border-radius: 0.33em; border-color: #a3d3ff; vertical-align: top; white-space: pre-wrap;&quot;&gt;&lt;div&gt;&lt;ins style=&quot;font-weight: bold; text-decoration: none;&quot;&gt;# &lt;/ins&gt;setwd(&quot;C:/Users/Evgeny/Documents/R_Text&quot;)&lt;/div&gt;&lt;/td&gt;&lt;/tr&gt;
&lt;tr&gt;&lt;td class=&quot;diff-marker&quot;&gt;&lt;/td&gt;&lt;td style=&quot;background-color: #f8f9fa; color: #202122; font-size: 88%; border-style: solid; border-width: 1px 1px 1px 4px; border-radius: 0.33em; border-color: #eaecf0; vertical-align: top; white-space: pre-wrap;&quot;&gt;&lt;br&gt;&lt;/td&gt;&lt;td class=&quot;diff-marker&quot;&gt;&lt;/td&gt;&lt;td style=&quot;background-color: #f8f9fa; color: #202122; font-size: 88%; border-style: solid; border-width: 1px 1px 1px 4px; border-radius: 0.33em; border-color: #eaecf0; vertical-align: top; white-space: pre-wrap;&quot;&gt;&lt;br&gt;&lt;/td&gt;&lt;/tr&gt;
&lt;tr&gt;&lt;td class=&quot;diff-marker&quot;&gt;&lt;/td&gt;&lt;td style=&quot;background-color: #f8f9fa; color: #202122; font-size: 88%; border-style: solid; border-width: 1px 1px 1px 4px; border-radius: 0.33em; border-color: #eaecf0; vertical-align: top; white-space: pre-wrap;&quot;&gt;&lt;div&gt;# Показать все файлы, включая скрытые&lt;/div&gt;&lt;/td&gt;&lt;td class=&quot;diff-marker&quot;&gt;&lt;/td&gt;&lt;td style=&quot;background-color: #f8f9fa; color: #202122; font-size: 88%; border-style: solid; border-width: 1px 1px 1px 4px; border-radius: 0.33em; border-color: #eaecf0; vertical-align: top; white-space: pre-wrap;&quot;&gt;&lt;div&gt;# Показать все файлы, включая скрытые&lt;/div&gt;&lt;/td&gt;&lt;/tr&gt;
&lt;/table&gt;</summary>
		<author><name>Patarakin</name></author>
	</entry>
	<entry>
		<id>http://digida.mgpu.ru/index.php?title=%D0%9C%D0%B5%D1%82%D0%BE%D0%B4%D1%8B_%D0%B8%D0%BD%D1%84%D0%BE%D1%80%D0%BC%D0%B0%D1%86%D0%B8%D0%BE%D0%BD%D0%BD%D0%BE%D0%B3%D0%BE_%D0%B0%D0%BD%D0%B0%D0%BB%D0%B8%D0%B7%D0%B0_%D1%82%D0%B5%D0%BA%D1%81%D1%82%D0%B0_(syllabus)_2025/%D0%A3%D1%80%D0%BE%D0%BA_1&amp;diff=31647&amp;oldid=prev</id>
		<title>Patarakin: Новая страница: «&lt;syntaxhighlight lang=&quot;R&quot; line&gt; # ============================================================================ # ЗАНЯТИЕ: Анализ текста в R с использованием tidytext # Автор: Евгений Патаракин # Дата: Сентябрь 2025 # ============================================================================  # ==================== # 1. НАСТРОЙКА РАБОЧЕЙ СРЕДЫ # ====================  #...»</title>
		<link rel="alternate" type="text/html" href="http://digida.mgpu.ru/index.php?title=%D0%9C%D0%B5%D1%82%D0%BE%D0%B4%D1%8B_%D0%B8%D0%BD%D1%84%D0%BE%D1%80%D0%BC%D0%B0%D1%86%D0%B8%D0%BE%D0%BD%D0%BD%D0%BE%D0%B3%D0%BE_%D0%B0%D0%BD%D0%B0%D0%BB%D0%B8%D0%B7%D0%B0_%D1%82%D0%B5%D0%BA%D1%81%D1%82%D0%B0_(syllabus)_2025/%D0%A3%D1%80%D0%BE%D0%BA_1&amp;diff=31647&amp;oldid=prev"/>
		<updated>2025-09-18T14:18:54Z</updated>

		<summary type="html">&lt;p&gt;Новая страница: «&amp;lt;syntaxhighlight lang=&amp;quot;R&amp;quot; line&amp;gt; # ============================================================================ # ЗАНЯТИЕ: Анализ текста в R с использованием tidytext # Автор: Евгений Патаракин # Дата: Сентябрь 2025 # ============================================================================  # ==================== # 1. НАСТРОЙКА РАБОЧЕЙ СРЕДЫ # ====================  #...»&lt;/p&gt;
&lt;p&gt;&lt;b&gt;Новая страница&lt;/b&gt;&lt;/p&gt;&lt;div&gt;&amp;lt;syntaxhighlight lang=&amp;quot;R&amp;quot; line&amp;gt;&lt;br /&gt;
# ============================================================================&lt;br /&gt;
# ЗАНЯТИЕ: Анализ текста в R с использованием tidytext&lt;br /&gt;
# Автор: Евгений Патаракин&lt;br /&gt;
# Дата: Сентябрь 2025&lt;br /&gt;
# ============================================================================&lt;br /&gt;
&lt;br /&gt;
# ====================&lt;br /&gt;
# 1. НАСТРОЙКА РАБОЧЕЙ СРЕДЫ&lt;br /&gt;
# ====================&lt;br /&gt;
&lt;br /&gt;
# Показать текущую рабочую директорию&lt;br /&gt;
getwd()&lt;br /&gt;
&lt;br /&gt;
# Посмотреть содержимое текущей директории&lt;br /&gt;
list.files()&lt;br /&gt;
&lt;br /&gt;
# Установить новую рабочую директорию (при необходимости)&lt;br /&gt;
# setwd(&amp;quot;путь/к/вашей/папке&amp;quot;)&lt;br /&gt;
setwd(&amp;quot;C:/Users/Evgeny/Documents/R_Text&amp;quot;)&lt;br /&gt;
&lt;br /&gt;
# Показать все файлы, включая скрытые&lt;br /&gt;
list.files(all.files = TRUE)&lt;br /&gt;
&lt;br /&gt;
# Показать файлы определённого типа&lt;br /&gt;
list.files(pattern = &amp;quot;*.csv&amp;quot;)&lt;br /&gt;
&lt;br /&gt;
# ====================&lt;br /&gt;
# 2. ОСНОВЫ СИНТАКСИСА R&lt;br /&gt;
# ====================&lt;br /&gt;
&lt;br /&gt;
# Создание переменных&lt;br /&gt;
text_example &amp;lt;- &amp;quot;Это пример текста для анализа&amp;quot;&lt;br /&gt;
numbers &amp;lt;- c(1, 2, 3, 4, 5)&lt;br /&gt;
logical_var &amp;lt;- TRUE&lt;br /&gt;
&lt;br /&gt;
# Просмотр структуры объектов&lt;br /&gt;
str(text_example)&lt;br /&gt;
str(numbers)&lt;br /&gt;
&lt;br /&gt;
# Типы данных&lt;br /&gt;
class(text_example)  # character&lt;br /&gt;
class(numbers)       # numeric&lt;br /&gt;
class(logical_var)   # logical&lt;br /&gt;
&lt;br /&gt;
# Векторы, списки и data.frame&lt;br /&gt;
vector_example &amp;lt;- c(&amp;quot;слово1&amp;quot;, &amp;quot;слово2&amp;quot;, &amp;quot;слово3&amp;quot;)&lt;br /&gt;
list_example &amp;lt;- list(text = text_example, nums = numbers)&lt;br /&gt;
df_example &amp;lt;- data.frame(&lt;br /&gt;
  id = 1:3,&lt;br /&gt;
  words = c(&amp;quot;привет&amp;quot;, &amp;quot;мир&amp;quot;, &amp;quot;анализ&amp;quot;),&lt;br /&gt;
  freq = c(10, 8, 15)&lt;br /&gt;
)&lt;br /&gt;
&lt;br /&gt;
# Просмотр данных&lt;br /&gt;
print(df_example)&lt;br /&gt;
head(df_example)&lt;br /&gt;
summary(df_example)&lt;br /&gt;
&lt;br /&gt;
# ====================&lt;br /&gt;
# 3. ЧТЕНИЕ И ЗАПИСЬ ФАЙЛОВ&lt;br /&gt;
# ====================&lt;br /&gt;
&lt;br /&gt;
# Установка и загрузка необходимых пакетов&lt;br /&gt;
if (!require(readr)) install.packages(&amp;quot;readr&amp;quot;)&lt;br /&gt;
if (!require(readxl)) install.packages(&amp;quot;readxl&amp;quot;)&lt;br /&gt;
library(readr)&lt;br /&gt;
library(readxl)&lt;br /&gt;
&lt;br /&gt;
# Чтение CSV файлов&lt;br /&gt;
# metaph-science-lens.csv&lt;br /&gt;
&lt;br /&gt;
data &amp;lt;- read_csv(&amp;quot;metaph-science-lens.csv&amp;quot;)&lt;br /&gt;
&lt;br /&gt;
&lt;br /&gt;
# ====================================================================&lt;br /&gt;
# УРОК: Работа с таблицей из metadata metaph-science-lens.csv&lt;br /&gt;
# Основные пакеты: dplyr, tidyr, tidytext, ggplot2&lt;br /&gt;
# ====================================================================&lt;br /&gt;
&lt;br /&gt;
# 1. ЗАГРУЗКА ПАКЕТОВ&lt;br /&gt;
if (!require(tidyverse)) install.packages(&amp;quot;tidyverse&amp;quot;)&lt;br /&gt;
if (!require(tidytext))  install.packages(&amp;quot;tidytext&amp;quot;)&lt;br /&gt;
library(dplyr)&lt;br /&gt;
library(tidyr)&lt;br /&gt;
library(tidytext)&lt;br /&gt;
library(ggplot2)&lt;br /&gt;
&lt;br /&gt;
# 2. ЗАГРУЗКА ДАННЫХ&lt;br /&gt;
# Предполагаем, что файл metaph-science-lens.csv в рабочей директории&lt;br /&gt;
data &amp;lt;- read_csv(&amp;quot;metaph-science-lens.csv&amp;quot;)&lt;br /&gt;
&lt;br /&gt;
# 3. ПОКАЗАТЬ НАЗВАНИЯ ВСЕХ СТОЛБЦОВ&lt;br /&gt;
colnames(data)&lt;br /&gt;
&lt;br /&gt;
# 4. СОЗДАНИЕ НОВОЙ ТАБЛИЦЫ С ВЫБОРКОЙ СТОЛБЦОВ&lt;br /&gt;
# Нас интересуют только Title, Abstract, Author/s, Fields of Study, Keywords, Citing Works Count&lt;br /&gt;
&lt;br /&gt;
&lt;br /&gt;
data %&amp;gt;%&lt;br /&gt;
  select(&lt;br /&gt;
    Title,&lt;br /&gt;
    Abstract,&lt;br /&gt;
    `Author/s`,&lt;br /&gt;
    `Fields of Study`,&lt;br /&gt;
    Keywords,&lt;br /&gt;
    `Citing Works Count`&lt;br /&gt;
  )&lt;br /&gt;
&lt;br /&gt;
data_selected &amp;lt;- data %&amp;gt;%&lt;br /&gt;
  select(&lt;br /&gt;
    Title,&lt;br /&gt;
    Abstract,&lt;br /&gt;
    `Author/s`,&lt;br /&gt;
    `Fields of Study`,&lt;br /&gt;
    Keywords,&lt;br /&gt;
    `Citing Works Count`&lt;br /&gt;
  )&lt;br /&gt;
&lt;br /&gt;
# Просмотр первых строк новой таблицы&lt;br /&gt;
glimpse(data_selected)&lt;br /&gt;
head(data_selected)&lt;br /&gt;
&lt;br /&gt;
# 5. ПОДГОТОВКА TEXT-DATA С TIDYTEXT&lt;br /&gt;
# 5.1 Токенизация абстрактов на слова&lt;br /&gt;
&lt;br /&gt;
abstract_tokens &amp;lt;- data_selected %&amp;gt;%&lt;br /&gt;
  filter(!is.na(Abstract), Abstract != &amp;quot;&amp;quot;) %&amp;gt;%             # убираем пустые Abstract&lt;br /&gt;
  select(Title, Abstract) %&amp;gt;%&lt;br /&gt;
  unnest_tokens(word, Abstract)&lt;br /&gt;
&lt;br /&gt;
# Показать первые 10 токенов&lt;br /&gt;
head(abstract_tokens, 10)&lt;br /&gt;
&lt;br /&gt;
# 5.2 Удаление английских стоп-слов&lt;br /&gt;
abstract_clean &amp;lt;- abstract_tokens %&amp;gt;%&lt;br /&gt;
  anti_join(get_stopwords(), by = &amp;quot;word&amp;quot;)&lt;br /&gt;
&lt;br /&gt;
####&lt;br /&gt;
custom_stop &amp;lt;- tibble(word = c(&amp;quot;de&amp;quot;, &amp;quot;p&amp;quot;, &amp;quot;la&amp;quot;))&lt;br /&gt;
abstract_clean2 &amp;lt;- abstract_clean %&amp;gt;%&lt;br /&gt;
  anti_join(custom_stop, by = &amp;quot;word&amp;quot;)&lt;br /&gt;
###&lt;br /&gt;
&lt;br /&gt;
# 5.3 Подсчет частоты слов&lt;br /&gt;
word_counts &amp;lt;- abstract_clean2 %&amp;gt;%&lt;br /&gt;
  count(word, sort = TRUE)&lt;br /&gt;
&lt;br /&gt;
# Показать топ-20 самых частых слов&lt;br /&gt;
head(word_counts, 20)&lt;br /&gt;
&lt;br /&gt;
# 6. ВИЗУАЛИЗАЦИЯ РАСПРЕДЕЛЕНИЯ СЛОВ&lt;br /&gt;
# 6.1 Столбчатая диаграмма для топ-15 слов&lt;br /&gt;
word_counts %&amp;gt;%&lt;br /&gt;
  slice_max(n, n = 15) %&amp;gt;%&lt;br /&gt;
  mutate(word = reorder(word, n)) %&amp;gt;%&lt;br /&gt;
  ggplot(aes(word, n)) +&lt;br /&gt;
  geom_col(fill = &amp;quot;steelblue&amp;quot;) +&lt;br /&gt;
  coord_flip() +&lt;br /&gt;
  labs(&lt;br /&gt;
    title = &amp;quot;Топ-15 слов в Abstract&amp;quot;,&lt;br /&gt;
    x = &amp;quot;Слова&amp;quot;,&lt;br /&gt;
    y = &amp;quot;Частота&amp;quot;&lt;br /&gt;
  ) +&lt;br /&gt;
  theme_minimal()&lt;br /&gt;
&lt;br /&gt;
# 6.2 Гистограмма длины Abstract (в словах)&lt;br /&gt;
# Сначала считаем длину каждого Abstract&lt;br /&gt;
abstract_lengths &amp;lt;- data_selected %&amp;gt;%&lt;br /&gt;
  filter(!is.na(Abstract), Abstract != &amp;quot;&amp;quot;) %&amp;gt;%&lt;br /&gt;
  mutate(word_count = str_count(Abstract, &amp;quot;\\S+&amp;quot;))&lt;br /&gt;
&lt;br /&gt;
ggplot(abstract_lengths, aes(x = word_count)) +&lt;br /&gt;
  geom_histogram(bins = 30, fill = &amp;quot;coral&amp;quot;, alpha = 0.7) +&lt;br /&gt;
  labs(&lt;br /&gt;
    title = &amp;quot;Распределение длины Abstract&amp;quot;,&lt;br /&gt;
    x = &amp;quot;Количество слов в Abstract&amp;quot;,&lt;br /&gt;
    y = &amp;quot;Число документов&amp;quot;&lt;br /&gt;
  ) +&lt;br /&gt;
  theme_minimal()&lt;br /&gt;
&lt;br /&gt;
# 7. АНАЛИЗ N-ГРАММ (биграммы)&lt;br /&gt;
bigrams &amp;lt;- data_selected %&amp;gt;%&lt;br /&gt;
  filter(!is.na(Abstract), Abstract != &amp;quot;&amp;quot;) %&amp;gt;%&lt;br /&gt;
  unnest_tokens(bigram, Abstract, token = &amp;quot;ngrams&amp;quot;, n = 2)&lt;br /&gt;
&lt;br /&gt;
# Разделение биграмм и удаление стоп-слов&lt;br /&gt;
bigrams_separate &amp;lt;- bigrams %&amp;gt;%&lt;br /&gt;
  separate(bigram, into = c(&amp;quot;w1&amp;quot;, &amp;quot;w2&amp;quot;), sep = &amp;quot; &amp;quot;) %&amp;gt;%&lt;br /&gt;
  filter(!w1 %in% get_stopwords()$word,&lt;br /&gt;
         !w2 %in% get_stopwords()$word)&lt;br /&gt;
&lt;br /&gt;
# Подсчет самых частых биграмм&lt;br /&gt;
bigram_counts &amp;lt;- bigrams_separate %&amp;gt;%&lt;br /&gt;
  unite(bigram, w1, w2, sep = &amp;quot; &amp;quot;) %&amp;gt;%&lt;br /&gt;
  count(bigram, sort = TRUE)&lt;br /&gt;
&lt;br /&gt;
head(bigram_counts, 15)&lt;br /&gt;
&lt;br /&gt;
# Визуализация топ-10 биграмм&lt;br /&gt;
bigram_counts %&amp;gt;%&lt;br /&gt;
  slice_max(n, n = 10) %&amp;gt;%&lt;br /&gt;
  mutate(bigram = reorder(bigram, n)) %&amp;gt;%&lt;br /&gt;
  ggplot(aes(bigram, n)) +&lt;br /&gt;
  geom_col(fill = &amp;quot;darkgreen&amp;quot;) +&lt;br /&gt;
  coord_flip() +&lt;br /&gt;
  labs(&lt;br /&gt;
    title = &amp;quot;Топ-10 биграмм в Abstract&amp;quot;,&lt;br /&gt;
    x = &amp;quot;Биграммы&amp;quot;,&lt;br /&gt;
    y = &amp;quot;Частота&amp;quot;&lt;br /&gt;
  ) +&lt;br /&gt;
  theme_minimal()&lt;br /&gt;
&lt;br /&gt;
# ====================================================================&lt;br /&gt;
&amp;lt;/syntaxhighlight&amp;gt;&lt;/div&gt;</summary>
		<author><name>Patarakin</name></author>
	</entry>
</feed>