datatools-server/src/main/java/com/conveyal/datatools/manager/controllers/api/ProjectController.java at d4362dfa1ec8ec9a57d807a0348865339b992eae · ibi-group/datatools-server · GitHub

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
package com.conveyal.datatools.manager.controllers.api;

import com.conveyal.datatools.common.utils.Scheduler;
import com.conveyal.datatools.common.utils.SparkUtils;
import com.conveyal.datatools.common.utils.aws.S3Utils;
import com.conveyal.datatools.manager.DataManager;
import com.conveyal.datatools.manager.auth.Auth0UserProfile;
import com.conveyal.datatools.manager.jobs.FetchProjectFeedsJob;
import com.conveyal.datatools.manager.jobs.PublishProjectFeedsJob;
import com.conveyal.datatools.manager.jobs.MergeFeedsJob;
import com.conveyal.datatools.manager.models.FeedDownloadToken;
import com.conveyal.datatools.manager.models.FeedRetrievalMethod;
import com.conveyal.datatools.manager.models.FeedSource;
import com.conveyal.datatools.manager.models.FeedVersion;
import com.conveyal.datatools.manager.models.JsonViews;
import com.conveyal.datatools.manager.models.OtpServer;
import com.conveyal.datatools.manager.models.Project;
import com.conveyal.datatools.manager.persistence.Persistence;
import com.conveyal.datatools.manager.utils.JobUtils;
import com.conveyal.datatools.manager.utils.json.JsonManager;
import org.bson.Document;
import org.eclipse.jetty.http.HttpStatus;
import org.slf4j.Logger;
import org.slf4j.LoggerFactory;
import spark.Request;
import spark.Response;

import java.util.Collection;
import java.util.HashSet;
import java.util.Set;
import java.util.stream.Collectors;

import static com.conveyal.datatools.common.utils.SparkUtils.downloadFile;
import static com.conveyal.datatools.common.utils.SparkUtils.formatJobMessage;
import static com.conveyal.datatools.common.utils.SparkUtils.logMessageAndHalt;
import static com.conveyal.datatools.manager.DataManager.publicPath;
import static com.conveyal.datatools.manager.jobs.feedmerge.MergeFeedsType.REGIONAL;
import static spark.Spark.delete;
import static spark.Spark.get;
import static spark.Spark.post;
import static spark.Spark.put;

/**
 * Handlers for HTTP API requests that affect Projects.
 * These methods are mapped to API endpoints by Spark.
 * TODO we could probably have one generic controller for all data types, and use path elements from the URL to route to different typed persistence instances.
 */
@SuppressWarnings({"unused", "ThrowableNotThrown"})
public class ProjectController {
    private static final Logger LOG = LoggerFactory.getLogger(ProjectController.class);

    /**
     * @return a list of all projects that are public or visible given the current user and organization.
     */
    private static Collection<Project> getAllProjects(Request req, Response res) {
        Auth0UserProfile userProfile = req.attribute("user");
        // TODO: move this filtering into database query to reduce traffic / memory
        return Persistence.projects.getAll().stream()
                .filter(p -> req.pathInfo().matches(publicPath) || userProfile.hasProject(p.id, p.organizationId))
                .map(p -> checkProjectPermissions(req, p, "view"))
                .collect(Collectors.toList());
    }

    /**
     * @return a Project object for the UUID included in the request.
     */
    private static Project getProject(Request req, Response res) {
        return requestProjectById(req, "view");
    }

    /**
     * Create a new Project and store it, setting fields according to the JSON in the request body.
     * @return the newly created Project with all the supplied fields, as it appears in the database.
     */
    private static Project createProject(Request req, Response res) {
        // TODO error handling when request is bogus
        // TODO factor out user profile fetching, permissions checks etc.
        Auth0UserProfile userProfile = req.attribute("user");
        Document newProjectFields = Document.parse(req.body());
        String organizationId = (String) newProjectFields.get("organizationId");
        boolean allowedToCreate = userProfile.canAdministerApplication() || userProfile.canAdministerOrganization(organizationId);
        // Data manager can operate without organizations for now, so we (hackishly/insecurely) deactivate permissions here
        if (organizationId == null) allowedToCreate = true;
        if (allowedToCreate) {
            Project newlyStoredProject = Persistence.projects.create(req.body());
            Scheduler.handleAutoFeedFetch(newlyStoredProject);
            return newlyStoredProject;
        } else {
            logMessageAndHalt(req, 403, "Not authorized to create a project on organization " + organizationId);
            return null;
        }
    }

    /**
     * Update fields in the Project with the given UUID. The fields to be updated are supplied as JSON in the request
     * body.
     * @return the Project as it appears in the database after the update.
     */
    private static Project updateProject(Request req, Response res) {
        // Fetch the project once to check permissions
        requestProjectById(req, "manage");
        try {
            String id = req.params("id");
            Document updateDocument = Document.parse(req.body());
            Project updatedProject = Persistence.projects.update(id, req.body());
            // Catch updates to auto-fetch params, and update the autofetch schedule accordingly.
            // TODO factor out into generic update hooks, or at least separate method
            Scheduler.handleAutoFeedFetch(updatedProject);
            return updatedProject;
        } catch (Exception e) {
            logMessageAndHalt(req, 500, "Error updating project", e);
            return null;
        }
    }

    /**
     * Delete the project for the UUID given in the request.
     */
    private static Project deleteProject(Request req, Response res) {
        // Fetch project first to check permissions, and so we can return the deleted project after deletion.
        Project project = requestProjectById(req, "manage");
        project.delete();
        return project;
    }

    /**
     * Manually fetch a feed all feeds in the project as a one-off operation, when the user clicks a button to request it.
     */
    private static String fetch(Request req, Response res) {
        Auth0UserProfile userProfile = req.attribute("user");
        Project p = requestProjectById(req, "manage");
        FetchProjectFeedsJob fetchProjectFeedsJob = new FetchProjectFeedsJob(p, userProfile);
        // This job is runnable because sometimes we schedule the task for a later time, but here we call it immediately
        // because it is short lived and just cues up more work.
        fetchProjectFeedsJob.run();
        return SparkUtils.formatJobMessage(fetchProjectFeedsJob.jobId, "Fetching all project feeds...");
    }

    /**
     * Public helper function that returns the requested object if the user has permissions for the specified action.
     * FIXME why can't we do this checking by passing in the project ID rather than the whole request?
     * FIXME: eliminate all stringly typed variables (action)
     * @param req spark Request object from API request
     * @param action action type (either "view" or "manage")
     * @return requested project
     */
    private static Project requestProjectById (Request req, String action) {
        String id = req.params("id");
        if (id == null) {
            logMessageAndHalt(req, 400, "Please specify id param");
        }
        return checkProjectPermissions(req, Persistence.projects.getById(id), action);
    }

    /**
     * Given a project object, this checks the user's permissions to take some specific action on it.
     * If the user does not have permission the Spark request is halted with an error.
     * TODO: remove all Spark halt calls from data manipulation functions, API implementation is leaking into data model
     * If the user does have permission we return the same project object that was input, but with the feedSources nulled out.
     * In the special case that the user is not logged in and is therefore only looking at public objects, the feed
     * sources list is replaced with one that only contains publicly visible feed sources.
     * This is because the UI only uses Project objects with embedded feedSources in the landing page, nowhere else.
     * That fetch with embedded feedSources should be done with something like GraphQL generating multiple backend
     * fetches, not with a field that's only populated and returned in special cases.
     * FIXME: this is a method with side effects and no clear single purpose, in terms of transformation of input to output.
     */
    private static Project checkProjectPermissions(Request req, Project project, String action) {
        Auth0UserProfile userProfile = req.attribute("user");
        // Check if request was made by a user that is not logged in
        boolean publicFilter = req.pathInfo().matches(publicPath);

        // check for null project
        if (project == null) {
            logMessageAndHalt(req, 400, "Project ID does not exist");
            return null;
        }

        boolean authorized;
        boolean isAdmin = userProfile.canAdministerProject(project);
        switch (action) {
            // TODO: limit create action to app/org admins? see code currently in createProject.
//            case "create":
//                authorized = userProfile.canAdministerOrganization(p.organizationId);
//                break;
            case "manage":
                authorized = isAdmin;
                break;
            case "view":
                // request only authorized if not via public path and user can view
                authorized = !publicFilter && userProfile.hasProject(project.id, project.organizationId);
                break;
            default:
                authorized = false;
                break;
        }

        // Filter labels
        project.labels = project.retrieveProjectLabels(isAdmin);


        // If the user is not logged in, include only public feed sources
        if (publicFilter){
            project.feedSources = project.retrieveProjectFeedSources().stream()
                    .filter(fs -> fs.isPublic)
                    .collect(Collectors.toList());
        } else {
            project.feedSources = null;
            if (!authorized) {
                logMessageAndHalt(req, 403, "User not authorized to perform action on project");
                return null;
            }
        }
        // if we make it here, user has permission and this is a valid project.
        return project;
    }

    /**
     * HTTP endpoint to initialize a merge project feeds operation. Client should check the job status endpoint for the
     * completion of merge project feeds job. On successful completion of the job, the client should make a GET request
     * to getFeedDownloadCredentials with the project ID to obtain either temporary S3 credentials or a download token
     * (depending on application configuration "application.data.use_s3_storage") to download the zip file.
     */
    static String mergeProjectFeeds(Request req, Response res) {
        Project project = requestProjectById(req, "view");
        Auth0UserProfile userProfile = req.attribute("user");
        if (!userProfile.canAdministerProject(project.id)) {
            logMessageAndHalt(req, HttpStatus.UNAUTHORIZED_401, "Must be a project admin to merge project feeds.");
        }
        Set<FeedVersion> feedVersions = new HashSet<>();
        // Get latest version for each feed source in project
        Collection<FeedSource> feedSources = project.retrieveProjectFeedSources();
        for (FeedSource feedSource : feedSources) {
            if (feedSource.retrievalMethod.equals(FeedRetrievalMethod.REGIONAL_MERGE)) {
                LOG.warn("Skipping {} feed source because it contains the regionally merged feed.", feedSource.name);
                continue;
            }
            // Check if feed version exists.
            // TODO: check that version passes baseline validation checks?
            FeedVersion version = feedSource.retrieveLatest();
            if (version == null) {
                LOG.warn("Skipping {} because it has no feed versions", feedSource.name);
                continue;
            }
            LOG.info("Adding {} feed to merged zip", feedSource.name);
            feedVersions.add(version);
        }
        // Check that the latest regionally merged feed does not already contain input feed versions.
        if (project.regionalFeedSourceId != null) {
            Set<String> versionIds = feedVersions.stream().map(FeedVersion::retrieveId).collect(Collectors.toSet());
            // Check that latest merged feed version is not a copy of what has already been merged.
            FeedSource regionalFeedSource = Persistence.feedSources.getById(project.regionalFeedSourceId);
            if (regionalFeedSource != null) {
                FeedVersion latest = regionalFeedSource.retrieveLatest();
                if (latest != null && latest.inputVersions.equals(versionIds)) {
                    logMessageAndHalt(
                        req,
                        HttpStatus.BAD_REQUEST_400,
                        "Merge feeds job aborted. Regional merge already exists for latest feed versions found in project."
                        );
                }
            }
        }
        MergeFeedsJob mergeFeedsJob = new MergeFeedsJob(userProfile, feedVersions, project.id, REGIONAL);
        JobUtils.heavyExecutor.execute(mergeFeedsJob);
        // Return job ID to requester for monitoring job status.
        return formatJobMessage(mergeFeedsJob.jobId, "Merge operation is processing.");
    }

    /**
     * Returns credentials that a client may use to then download a feed version. Functionality
     * changes depending on whether application.data.use_s3_storage config property is true.
     */
    private static Object getFeedDownloadCredentials(Request req, Response res) {
        Project project = requestProjectById(req, "view");

        // if storing feeds on s3, return temporary s3 credentials for that zip file
        if (DataManager.useS3) {
            // Return presigned download link if using S3.
            String key = String.format("project/%s.zip", project.id);
            return S3Utils.downloadObject(S3Utils.DEFAULT_BUCKET, key, false, req, res);
        } else {
            // when feeds are stored locally, single-use download token will still be used
            FeedDownloadToken token = new FeedDownloadToken(project);
            Persistence.tokens.create(token);
            return token;
        }
    }

    /**
     * Copy all the latest feed versions for all public feed sources in this project to a bucket on S3.
     * Updates the index.html document that serves as a listing of those objects on S3.
     * This is often referred to as "deploying" the project.
     */
    private static String publishPublicFeeds(Request req, Response res) {
        Auth0UserProfile userProfile = req.attribute("user");
        String id = req.params("id");
        if (id == null) {
            logMessageAndHalt(req, 400, "must provide project id!");
        }
        Project p = Persistence.projects.getById(id);
        if (p == null) {
            logMessageAndHalt(req, 400, "no such project!");
        }
        // Run as lightweight job.
        PublishProjectFeedsJob publishProjectFeedsJob = new PublishProjectFeedsJob(p, userProfile);
        JobUtils.lightExecutor.execute(publishProjectFeedsJob);
        return formatJobMessage(publishProjectFeedsJob.jobId, "Publishing public feeds");
    }

    /**
     * Spark endpoint to synchronize this project's feed sources with another website or service that maintains an
     * index of GTFS data. This action is triggered manually by a UI button and for now never happens automatically.
     * An ExternalFeedResource of the specified type must be present in DataManager.feedResources
     */
    private static Project thirdPartySync(Request req, Response res) {
        Auth0UserProfile userProfile = req.attribute("user");
        String id = req.params("id");
        Project proj = Persistence.projects.getById(id);

        String syncType = req.params("type");

        if (!userProfile.canAdministerProject(proj)) {
            logMessageAndHalt(req, 403, "Third-party sync not permitted for user.");
        }

        LOG.info("syncing with third party " + syncType);
        if(DataManager.feedResources.containsKey(syncType)) {
            try {
                DataManager.feedResources.get(syncType).importFeedsForProject(proj, req.headers("Authorization"));
            } catch (Exception e) {
                logMessageAndHalt(req, 500, "An error occurred while trying to sync", e);
            }
            return proj;
        }

        logMessageAndHalt(req, 404, syncType + " sync type not enabled for application.");
        return null;
    }

    /**
     * This connects all the above HTTP API handlers to URL paths (registers them with the Spark framework).
     * A bit too static/global for an OO language, but that's how Spark works.
     */
    public static void register (String apiPrefix) {
        // Construct JSON managers which help serialize the response. Slim JSON is the generic JSON view. Full JSON
        // contains additional fields (at the moment just #OtpServerWithoutEc2Instances) and should only be used when the controller
        // returns a single project (slimJson is better suited for a collection). If fullJson is attempted for use
        // with a collection, massive performance issues will ensue (mainly due to multiple calls to AWS EC2).
        JsonManager<Project> slimJson = new JsonManager<>(Project.class, JsonViews.UserInterface.class);
        JsonManager<Project> fullJson = new JsonManager<>(Project.class, JsonViews.UserInterface.class);
        fullJson.addMixin(Project.class, Project.ProjectWithOtpServers.class);
        fullJson.addMixin(OtpServer.class, OtpServer.OtpServerWithoutEc2Instances.class);
        slimJson.addMixin(Project.class, Project.ProjectWithOtpServers.class);

        get(apiPrefix + "secure/project/:id", ProjectController::getProject, fullJson::write);
        get(apiPrefix + "secure/project", ProjectController::getAllProjects, slimJson::write);
        post(apiPrefix + "secure/project", ProjectController::createProject, fullJson::write);
        put(apiPrefix + "secure/project/:id", ProjectController::updateProject, fullJson::write);
        delete(apiPrefix + "secure/project/:id", ProjectController::deleteProject, fullJson::write);
        get(apiPrefix + "secure/project/:id/thirdPartySync/:type", ProjectController::thirdPartySync, fullJson::write);
        post(apiPrefix + "secure/project/:id/fetch", ProjectController::fetch, fullJson::write);
        post(apiPrefix + "secure/project/:id/deployPublic", ProjectController::publishPublicFeeds, fullJson::write);

        get(apiPrefix + "secure/project/:id/download", ProjectController::mergeProjectFeeds);
        get(apiPrefix + "secure/project/:id/downloadtoken", ProjectController::getFeedDownloadCredentials, fullJson::write);

        get(apiPrefix + "public/project/:id", ProjectController::getProject, fullJson::write);
        get(apiPrefix + "public/project", ProjectController::getAllProjects, slimJson::write);
        get(apiPrefix + "downloadprojectfeed/:token", ProjectController::downloadMergedFeedWithToken);
    }

    /**
     * HTTP endpoint that allows the requester to download a merged project feeds file stored locally (it should only
     * be invoked if the application is not using S3 storage) given that the requester supplies a valid token.
     */
    private static Object downloadMergedFeedWithToken(Request req, Response res) {
        FeedDownloadToken token = Persistence.tokens.getById(req.params("token"));

        if(token == null || !token.isValid()) {
            logMessageAndHalt(req, 400, "Feed download token not valid");
        }

        Project project = token.retrieveProject();

        Persistence.tokens.removeById(token.id);
        String fileName = project.id + ".zip";
        return downloadFile(FeedVersion.feedStore.getFeed(fileName), fileName, req, res);
    }

}