使用 muut.rb 导入

您好,

运行 muut 的导入脚本时,我遇到了以下错误:

正在导入分类
    2 / 2 (100.0%)  [5170854 项/分钟]   
正在导入讨论
Traceback (most recent call last):
	8: from script/import_scripts/muut.rb:184:in `<main>'
	7: from /var/www/discourse/script/import_scripts/base.rb:47:in `perform'
	6: from script/import_scripts/muut.rb:25:in `execute'
	5: from script/import_scripts/muut.rb:82:in `import_discussions'
	4: from script/import_scripts/muut.rb:82:in `each'
	3: from script/import_scripts/muut.rb:84:in `block in import_discussions'
	2: from script/import_scripts/muut.rb:84:in `each'
	1: from script/import_scripts/muut.rb:110:in `block (2 levels) in import_discussions'
script/import_scripts/muut.rb:162:in `process_muut_post_body': undefined method `gsub!' for nil:NilClass (NoMethodError)

有人能指点我如何绕过这个错误吗?

某些字段(可能是帖子数据)缺失,可能是因为脚本访问了错误的字段名称。

这是一个对我有效的更新 muut.rb:

# frozen_string_literal: true

require "csv"
require File.expand_path(File.dirname(__FILE__) + "/base.rb")

# 编辑常量并初始化您的导入数据。

class ImportScripts::Muut < ImportScripts::Base

  JSON_FILE_PATH = "/path/to/json/file"
  CSV_FILE_PATH = "/path/to/csv/file"

  def initialize
super

@imported_users = load_csv
@imported_json = load_json
  end

  def execute
puts "", "正在从 Muut 导入..."

import_users
import_categories
import_discussions

puts "", "完成"
  end

  def load_json
JSON.parse(repair_json(File.read(JSON_FILE_PATH)))
  end

  def load_csv
CSV.parse(File.read(CSV_FILE_PATH))
  end

  def repair_json(arg)
arg.gsub!(/^\(/, "")     # 文件内容被 ( ) 包围
arg.gsub!(/\)$/, "")

arg.gsub!(/\]\]$/, "]")  # 末尾可能有多余的 ]

arg.gsub!(/\}\{/, "},{") # 有时缺少逗号!

arg.gsub!("}]{", "},{")  # 意外的方括号
arg.gsub!("}[{", "},{")  # :troll:

arg
  end

  def import_users
puts '', "正在导入用户"

create_users(@imported_users) do |u|
  {
    id: u[0],
    email: u[1],
    created_at: Time.now
  }
end
  end

  def import_categories
puts "", "正在导入分类"

create_categories(@imported_json['categories']) do |category|
  {
    id: category['path'], # muut 没有分类 ID,因此使用路径
    name: category['title'],
    slug: category['path']
  }
end
  end

  def import_discussions
puts "", "正在导入讨论"

topics = 0
posts = 0

@imported_json['categories'].each do |category|

  @imported_json['threads'][category['path']].each do |thread|

    next if thread["seed"]["key"] == "skip-this-topic"

    mapped = {}
    mapped[:id] = "#{thread["seed"]["key"]}-#{thread["seed"]["date"]}"

    if thread["seed"]["author"] && user_id_from_imported_user_id(thread["seed"]["author"]["path"]) != ""
      mapped[:user_id] = user_id_from_imported_user_id(thread["seed"]["author"]["path"]) || -1
    else
      mapped[:user_id] = -1
    end

    # 更新用户显示名称
    if thread["seed"]["author"] && thread["seed"]["author"]["displayname"] != "" && mapped[:user_id] != -1
      user = User.find_by(id: mapped[:user_id])
      if user
        user.name = thread["seed"]["author"]["displayname"]
        user.save!
      end
    end

    mapped[:created_at] = Time.zone.at(thread["seed"]["date"])
    mapped[:category] = category_id_from_imported_category_id(thread["seed"]["path"])
    mapped[:title] = CGI.unescapeHTML(thread["seed"]["title"])

    if thread["seed"]["body"] == ""
      thread["seed"]["body"] = " ";
    end
    mapped[:raw] = process_muut_post_body(thread["seed"]["body"])
    mapped[:raw] = CGI.unescapeHTML(thread["seed"]["title"]) if mapped[:raw] == ""

    parent_post = create_post(mapped, mapped[:id])
    unless parent_post.is_a?(Post)
      puts "创建主题 #{mapped[:id]} 时出错。跳过。"
      puts parent_post.inspect
    end

    # 取消注释以下行以创建永久链接
    # Permalink.create(url: "#{thread["seed"]["path"]}:#{thread["seed"]["key"]}", topic_id: parent_post.topic_id)

    # 创建回复
    if thread["replies"].present? && thread["replies"].count > 0
      thread["replies"].reverse_each do |post|

        if post_id_from_imported_post_id(post["id"])
          next # 已导入此帖子
        end

        if post["body"] == ""
          post["body"] = " "
        end

        new_post = create_post({
            id: "#{post["key"]}-#{post["date"]}",
            topic_id: parent_post.topic_id,
            # 修改以下行以从 author/path 值获取唯一的 user_id。
            user_id: user_id_from_imported_user_id(post["author"]["path"]) || -1,
            raw: process_muut_post_body(post["body"]),
            created_at: Time.zone.at(post["date"])
          }, post["id"])

        if new_post.is_a?(Post)
          posts += 1
        else
          puts "创建帖子 #{post["id"]} 时出错。跳过。"
          puts new_post.inspect
        end

      end

    end

    topics += 1
  end
end

puts "", "已导入 #{topics} 个主题,共 #{topics + posts} 篇帖子。"
  end

  def process_muut_post_body(arg)
raw = arg.dup
raw = raw.to_s
raw = raw[0..-1]

# 换行
if raw != nil 
  raw.gsub!(/\\n/, "\n")

# 代码块
  raw.gsub!("---", "```\n")

# 制表符
  raw.gsub!(/\\t/, '  ')

# 双引号
  raw.gsub!(/\\\"/, '"')

  raw = CGI.unescapeHTML(raw)
end
raw
  end

  def file_full_path(relpath)
File.join JSON_FILES_DIR, relpath.split("?").first
  end

end

if __FILE__ == $0
  ImportScripts::Muut.new.perform
end