mirror of
https://github.com/discourse/discourse.git
synced 2025-01-22 23:26:15 +08:00
30990006a9
This reduces the chance of errors where consumers of strings mutate their inputs, and it reduces the memory usage of the app. The test suite passes now, but there may be some stuff left, so we will run a few sites on a branch prior to merging.
79 lines
2.5 KiB
Ruby
79 lines
2.5 KiB
Ruby
# frozen_string_literal: true
|
|
|
|
# Normalises the free-form `incoming_links.referer` URL into two lookup
# tables: `incoming_referers` (one row per distinct referer URL) and
# `incoming_domains` (one row per distinct name/port/https combination).
# `incoming_links` keeps only an `incoming_referer_id` pointing at the former.
class IncomingLinkNormalization < ActiveRecord::Migration[4.2]
  # Applies the schema changes and backfills the new tables.
  # The order matters: each backfill reads columns that a later step removes.
  def up
    remove_column :incoming_links, :post_number
    remove_column :incoming_links, :domain
    add_column :incoming_links, :incoming_referer_id, :integer

    build_incoming_referers
    build_incoming_domains

    # These columns were only needed to derive incoming_domains and to join
    # referers back to it; the data now lives on incoming_domains.
    remove_column :incoming_referers, :domain
    remove_column :incoming_referers, :port
    remove_column :incoming_referers, :https

    # Tightened only after the backfill above has populated the column.
    change_column :incoming_referers, :incoming_domain_id, :integer, null: false

    add_index :incoming_referers, %i[path incoming_domain_id], unique: true
    add_index :incoming_domains, %i[name https port], unique: true

    # The raw URL is dropped last, once every link has been re-pointed.
    remove_column :incoming_links, :referer
  end

  # Not reversible: `up` drops columns from incoming_links, so this always
  # raises ActiveRecord::IrreversibleMigration.
  def down
    raise ActiveRecord::IrreversibleMigration
  end

  private

  # Creates incoming_referers, fills it from the distinct http(s) referers in
  # incoming_links, then points each incoming_links row at its referer row.
  def build_incoming_referers
    create_table :incoming_referers do |table|
      table.string :url, limit: 1000, null: false
      table.string :domain, limit: 100, null: false
      table.string :path, limit: 1000, null: false
      table.integer :port, null: false
      table.boolean :https, null: false
      table.integer :incoming_domain_id
    end

    # start the shuffle
    #
    # Regex capture groups: a[1] = 's' for https, a[2] = host,
    # a[4] = port digits, a[5] = remainder of the URL (stored as path).
    #
    # NOTE(review): this heredoc processes escapes exactly like the original
    # double-quoted string did, and Ruby turns the unrecognised escape `\d`
    # into a plain `d`. PostgreSQL therefore receives `(:(d+))?`, so a numeric
    # port never lands in a[4]: the scheme default (80/443) is stored and the
    # ":<port>" text stays at the front of `path`. Deliberately left as is --
    # parsing ports would change the rows this migration produces and could
    # make distinct URLs collide on the unique (path, incoming_domain_id)
    # index added later in `up`.
    execute <<~SQL
      INSERT INTO incoming_referers(url, https, domain, port, path)
      SELECT referer,
             CASE WHEN a[1] = 's' THEN true ELSE false END,
             a[2] as domain,
             CASE WHEN a[1] = 's' THEN
               COALESCE(a[4]::integer, 443)::integer
             ELSE
               COALESCE(a[4]::integer, 80)::integer
             END,
             COALESCE(a[5], '') path
      FROM
      (
        SELECT referer, regexp_matches(referer, 'http(s)?://([^/:]+)(:(\d+))?(.*)') a
        FROM
        (
          SELECT DISTINCT referer
          FROM incoming_links WHERE referer ~ '^https?://.+'
        ) Z
      ) X
      WHERE a[2] IS NOT NULL
    SQL

    # Links whose referer did not produce a row above keep a NULL id.
    execute <<~SQL
      UPDATE incoming_links l
      SET incoming_referer_id = r.id
      FROM incoming_referers r
      WHERE r.url = l.referer
    SQL
  end

  # Creates incoming_domains from the distinct (domain, port, https) triples
  # in incoming_referers, then records the matching domain id on each referer.
  def build_incoming_domains
    create_table :incoming_domains do |table|
      table.string :name, limit: 100, null: false
      table.boolean :https, null: false, default: false
      table.integer :port, null: false
    end

    # shuffle part 2
    #
    execute <<~SQL
      INSERT INTO incoming_domains(name, port, https)
      SELECT DISTINCT domain, port, https
      FROM incoming_referers
    SQL

    execute <<~SQL
      UPDATE incoming_referers l
      SET incoming_domain_id = d.id
      FROM incoming_domains d
      WHERE d.name = l.domain AND d.https = l.https AND d.port = l.port
    SQL
  end
end
|