require './spec/support/sidekiq_middleware' class Gitlab::Seeder::Projects include ActionView::Helpers::NumberHelper PROJECT_URLS = %w[ https://gitlab.com/gitlab-org/gitlab-test.git https://gitlab.com/gitlab-org/gitlab-shell.git https://gitlab.com/gnuwget/wget2.git https://gitlab.com/Commit451/LabCoat.git https://github.com/jashkenas/underscore.git https://github.com/flightjs/flight.git https://github.com/twitter/typeahead.js.git https://github.com/h5bp/html5-boilerplate.git https://github.com/google/material-design-lite.git https://github.com/jlevy/the-art-of-command-line.git https://github.com/FreeCodeCamp/freecodecamp.git https://github.com/google/deepdream.git https://github.com/jtleek/datasharing.git https://github.com/WebAssembly/design.git https://github.com/airbnb/javascript.git https://github.com/tessalt/echo-chamber-js.git https://github.com/atom/atom.git https://github.com/mattermost/mattermost-server.git https://github.com/purifycss/purifycss.git https://github.com/facebook/nuclide.git https://github.com/wbkd/awesome-d3.git https://github.com/kilimchoi/engineering-blogs.git https://github.com/gilbarbara/logos.git https://github.com/reduxjs/redux.git https://github.com/awslabs/s2n.git https://github.com/arkency/reactjs_koans.git https://github.com/twbs/bootstrap.git https://github.com/chjj/ttystudio.git https://github.com/MostlyAdequate/mostly-adequate-guide.git https://github.com/octocat/Spoon-Knife.git https://github.com/opencontainers/runc.git https://github.com/googlesamples/android-topeka.git ] LARGE_PROJECT_URLS = %w[ https://github.com/torvalds/linux.git https://gitlab.gnome.org/GNOME/gimp.git https://gitlab.gnome.org/GNOME/gnome-mud.git https://gitlab.com/fdroid/fdroidclient.git https://gitlab.com/inkscape/inkscape.git https://github.com/gnachman/iTerm2.git ] # Consider altering MASS_USERS_COUNT for less # users with projects. MASS_PROJECTS_COUNT_PER_USER = { private: 3, # 3m projects + internal: 1, # 1m projects + public: 1 # 1m projects = 5m total } def seed! Sidekiq::Testing.inline! do create_real_projects! create_large_projects! create_mass_projects! end end private def create_real_projects! # You can specify how many projects you need during seed execution size = ENV['SIZE'].present? ? ENV['SIZE'].to_i : 8 PROJECT_URLS.first(size).each_with_index do |url, i| create_real_project!(url, force_latest_storage: i.even?) end end def create_large_projects! return unless ENV['LARGE_PROJECTS'].present? LARGE_PROJECT_URLS.each(&method(:create_real_project!)) if ENV['FORK'].present? puts "\nGenerating forks" project_name = ENV['FORK'] == 'true' ? 'torvalds/linux' : ENV['FORK'] project = Project.find_by_full_path(project_name) User.offset(1).first(5).each do |user| new_project = ::Projects::ForkService.new(project, user).execute if new_project.valid? && (new_project.valid_repo? || new_project.import_state.scheduled?) print '.' else new_project.errors.full_messages.each do |error| puts "#{new_project.full_path}: #{error}" end print 'F' end end end end def create_real_project!(url, force_latest_storage: false) group_path, project_path = url.split('/')[-2..-1] group = Group.find_by(path: group_path) unless group group = Group.new( name: group_path.titleize, path: group_path ) group.description = FFaker::Lorem.sentence group.save! group.add_owner(User.first) end project_path.gsub!(".git", "") params = { import_url: url, namespace_id: group.id, name: project_path.titleize, description: FFaker::Lorem.sentence, visibility_level: Gitlab::VisibilityLevel.values.sample, skip_disk_validation: true } if force_latest_storage params[:storage_version] = Project::LATEST_STORAGE_VERSION end project = nil Sidekiq::Worker.skipping_transaction_check do project = ::Projects::CreateService.new(User.first, params).execute # Seed-Fu runs this entire fixture in a transaction, so the `after_commit` # hook won't run until after the fixture is loaded. That is too late # since the Sidekiq::Testing block has already exited. Force clearing # the `after_commit` queue to ensure the job is run now. project.send(:_run_after_commit_queue) project.import_state.send(:_run_after_commit_queue) # Expire repository cache after import to ensure # valid_repo? call below returns a correct answer project.repository.expire_all_method_caches end if project.valid? && project.valid_repo? print '.' else puts project.errors.full_messages print 'F' end end def create_mass_projects! projects_per_user_count = MASS_PROJECTS_COUNT_PER_USER.values.sum visibility_per_user = ['private'] * MASS_PROJECTS_COUNT_PER_USER.fetch(:private) + ['internal'] * MASS_PROJECTS_COUNT_PER_USER.fetch(:internal) + ['public'] * MASS_PROJECTS_COUNT_PER_USER.fetch(:public) visibility_level_per_user = visibility_per_user.map { |visibility| Gitlab::VisibilityLevel.level_value(visibility) } visibility_per_user = visibility_per_user.join(',') visibility_level_per_user = visibility_level_per_user.join(',') Gitlab::Seeder.with_mass_insert(User.count * projects_per_user_count, "Projects and relations") do ActiveRecord::Base.connection.execute <<~SQL INSERT INTO projects (name, path, creator_id, namespace_id, visibility_level, created_at, updated_at) SELECT 'Seed project ' || seq || ' ' || ('{#{visibility_per_user}}'::text[])[seq] AS project_name, '#{Gitlab::Seeder::MASS_INSERT_PROJECT_START}' || ('{#{visibility_per_user}}'::text[])[seq] || '_' || seq AS project_path, u.id AS user_id, n.id AS namespace_id, ('{#{visibility_level_per_user}}'::int[])[seq] AS visibility_level, NOW() AS created_at, NOW() AS updated_at FROM users u CROSS JOIN generate_series(1, #{projects_per_user_count}) AS seq JOIN namespaces n ON n.owner_id=u.id SQL ActiveRecord::Base.connection.execute <<~SQL INSERT INTO project_features (project_id, merge_requests_access_level, issues_access_level, wiki_access_level, pages_access_level) SELECT id, #{ProjectFeature::ENABLED} AS merge_requests_access_level, #{ProjectFeature::ENABLED} AS issues_access_level, #{ProjectFeature::ENABLED} AS wiki_access_level, #{ProjectFeature::ENABLED} AS pages_access_level FROM projects ON CONFLICT (project_id) DO NOTHING; SQL ActiveRecord::Base.connection.execute <<~SQL INSERT INTO routes (source_id, source_type, name, path) SELECT p.id, 'Project', u.name || ' / ' || p.name, u.username || '/' || p.path FROM projects p JOIN users u ON u.id=p.creator_id ON CONFLICT (source_type, source_id) DO NOTHING; SQL end end end Gitlab::Seeder.quiet do projects = Gitlab::Seeder::Projects.new projects.seed! end